<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR AI</journal-id>
      <journal-title>JMIR AI</journal-title>
      <issn pub-type="epub">2817-1705</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v2i1e41264</article-id>
      <article-id pub-id-type="pmid">38875552</article-id>
      <article-id pub-id-type="doi">10.2196/41264</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Developing an Inpatient Electronic Medical Record Phenotype for Hospital-Acquired Pressure Injuries: Case Study Using Natural Language Processing Models</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>El Emam</surname>
            <given-names>Khaled</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Malin</surname>
            <given-names>Bradley</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ru</surname>
            <given-names>Boshu</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhang</surname>
            <given-names>Tianlin</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Nurmambetova</surname>
            <given-names>Elvira</given-names>
          </name>
          <degrees>BHSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Centre for Health Informatics</institution>
            <institution>Cumming School of Medicine</institution>
            <institution>University of Calgary</institution>
            <addr-line>3330 Hospital Dr NW</addr-line>
            <addr-line>Calgary, AB, T2N 4N1</addr-line>
            <country>Canada</country>
            <phone>1 4032206843</phone>
            <email>elvira.nurmambetova@ucalgary.ca</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6391-8714</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Pan</surname>
            <given-names>Jie</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6398-1756</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Zilong</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0239-8959</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>Guosong</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0440-0784</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Seungwon</given-names>
          </name>
          <degrees>MPH, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6532-5303</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Southern</surname>
            <given-names>Danielle A</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0006-0033</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Martin</surname>
            <given-names>Elliot A</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5127-4333</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Ho</surname>
            <given-names>Chester</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4238-5506</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>Yuan</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2100-9437</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Eastwood</surname>
            <given-names>Cathy A</given-names>
          </name>
          <degrees>RN, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4569-8014</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Centre for Health Informatics</institution>
        <institution>Cumming School of Medicine</institution>
        <institution>University of Calgary</institution>
        <addr-line>Calgary, AB</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Community Health Sciences</institution>
        <institution>Cumming School of Medicine</institution>
        <institution>University of Calgary</institution>
        <addr-line>Calgary, AB</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Alberta Health Services</institution>
        <addr-line>Edmonton, AB</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Medicine</institution>
        <institution>Faculty of Medicine &#38; Dentistry</institution>
        <institution>University of Alberta</institution>
        <addr-line>Edmonton, AB</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Oncology</institution>
        <institution>University of Calgary</institution>
        <institution>Tom Baker Cancer Centre</institution>
        <addr-line>Calgary, AB</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department of Surgery</institution>
        <institution>Foothills Medical Centre</institution>
        <institution>University of Calgary</institution>
        <addr-line>Calgary, AB</addr-line>
        <country>Canada</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Elvira Nurmambetova <email>elvira.nurmambetova@ucalgary.ca</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>8</day>
        <month>3</month>
        <year>2023</year>
      </pub-date>
      <volume>2</volume>
      <elocation-id>e41264</elocation-id>
      <history>
        <date date-type="received">
          <day>24</day>
          <month>7</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>5</day>
          <month>10</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>1</day>
          <month>1</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>15</day>
          <month>1</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Elvira Nurmambetova, Jie Pan, Zilong Zhang, Guosong Wu, Seungwon Lee, Danielle A Southern, Elliot A Martin, Chester Ho, Yuan Xu, Cathy A Eastwood. Originally published in JMIR AI (https://ai.jmir.org), 08.03.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on https://www.ai.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://ai.jmir.org/2023/1/e41264" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Surveillance of hospital-acquired pressure injuries (HAPI) is often suboptimal when relying on administrative health data, as International Classification of Diseases (ICD) codes are known to have long delays and are undercoded. We leveraged natural language processing (NLP) applications on free-text notes, particularly the inpatient nursing notes, from electronic medical records (EMRs), to more accurately and timely identify HAPIs.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to show that EMR-based phenotyping algorithms are more fitted to detect HAPIs than ICD-10-CA algorithms alone, while the clinical logs are recorded with higher accuracy via NLP using nursing notes.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Patients with HAPIs were identified from head-to-toe skin assessments in a local tertiary acute care hospital during a clinical trial that took place from 2015 to 2018 in Calgary, Alberta, Canada. Clinical notes documented during the trial were extracted from the EMR database after the linkage with the discharge abstract database. Different combinations of several types of clinical notes were processed by sequential forward selection during the model development. Text classification algorithms for HAPI detection were developed using random forest (RF), extreme gradient boosting (XGBoost), and deep learning models. The classification threshold was tuned to enable the model to achieve similar specificity to an ICD-based phenotyping study. Each model’s performance was assessed, and comparisons were made between the metrics, including sensitivity, positive predictive value, negative predictive value, and <italic>F</italic><sub>1</sub>-score.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Data from 280 eligible patients were used in this study, among whom 97 patients had HAPIs during the trial. RF was the optimal performing model with a sensitivity of 0.464 (95% CI 0.365-0.563), specificity of 0.984 (95% CI 0.965-1.000), and <italic>F</italic><sub>1</sub>-score of 0.612 (95% CI of 0.473-0.751). The machine learning (ML) model reached higher sensitivity without sacrificing much specificity compared to the previously reported performance of ICD-based algorithms.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The EMR-based NLP phenotyping algorithms demonstrated improved performance in HAPI case detection over ICD-10-CA codes alone. Daily generated nursing notes in EMRs are a valuable data resource for ML models to accurately detect adverse events. The study contributes to enhancing automated health care quality and safety surveillance.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>pressure injury</kwd>
        <kwd>natural language processing</kwd>
        <kwd>NLP</kwd>
        <kwd>algorithm</kwd>
        <kwd>phenotype algorithm</kwd>
        <kwd>phenotyping algorithm</kwd>
        <kwd>machine learning</kwd>
        <kwd>electronic medical record</kwd>
        <kwd>EMR</kwd>
        <kwd>pressure sore</kwd>
        <kwd>pressure wound</kwd>
        <kwd>pressure ulcer</kwd>
        <kwd>pressure injuries</kwd>
        <kwd>detect</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Pressure injury (PI), also known as a pressure ulcer, is an injury of the skin and deep tissues caused by external pressures. Annually, PIs affect approximately 250,000 to 500,000 Canadians, with an estimated prevalence of 26.0% in health care institutions [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Hospital-acquired pressure injuries (HAPIs) are PIs developed during an inpatient hospital stay. HAPIs can significantly extend a patient’s hospitalization length of stay and cause severe secondary complications, such as muscle and profound tissue impairment [<xref ref-type="bibr" rid="ref3">3</xref>]. HAPI is considered mostly preventable, and its prevalence has been reckoned as an acceptable indicator of the quality of care [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Collecting HAPI status using chart review is time and labor-intensive, thereby not suitable for large-scale population-based applications. Considering all the factors, there is a need for automated ways to accurately and timely identify HAPIs for analyzing large cohort studies that support quality improvement efforts and assisting unit managers with developing reliable patient safety programs. The International Classification of Diseases, 10th Revision, adapted to the Canadian health system (ICD-10-CA), can be used to estimate the prevalence of adverse events from administrative data. However, the coded administrative data are prone to miss positive cases: previous research demonstrated that the sensitivity of the ICD algorithm for identifying HAPI cases is around 30% compared to chart review [<xref ref-type="bibr" rid="ref1">1</xref>]. In addition to the sensitivity issue, ICD codes are not generally assigned with a specific time when diseases occur. Therefore, they are unsuitable for reporting the time when HAPIs occur [<xref ref-type="bibr" rid="ref6">6</xref>]. Thus, there is a need for more accurate HAPI detection.</p>
      <p>Electronic medical records (EMRs) are used to track and organize patient information for efficient treatment of medical conditions in a secure system [<xref ref-type="bibr" rid="ref7">7</xref>]. Free-text clinical notes in EMRs consist of detailed descriptions of patients' conditions and treatment. Additionally, clinical notes are typically written in a continuous manner across patients' interactions with health care systems, making clinical notes more real-time compared to diagnosis codes. Despite the rich information the clinical record may have, coders often cannot read every entry, given their limited time per chart and many patients have prolonged hospital stays. Recent studies suggest that using free-text in EMRs alone, or incorporating EMR data elements, can significantly improve the accuracy of case identification of specific comorbidities [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. Xu et al compared the ICD algorithm with algorithms based on EMR keyword search, which achieved a high sensitivity of 0.655 (95% CI 0.601-0.710) [<xref ref-type="bibr" rid="ref8">8</xref>]. The Canadian health system operates as a publicly funded single-payer insurance system by the federal, provincial, and territorial governments [<xref ref-type="bibr" rid="ref17">17</xref>]. Additional crown institutions at the provincial and federal-level monitor adverse events such as HAPI. For example, in Alberta, Canadian Institute for Health Information, the federal crown corporation, works with Alberta Health Services (provincial health care agency) to monitor PIs [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. To date, there is no mandatory collection of PIs within Canadian acute-care facilities. Real-time PI evaluation and auditing using ICD codes are not possible as Canadian health data systems are set up such that ICD codes are assigned outside of providing care and have a few months lag in data extraction, transfer, and load [<xref ref-type="bibr" rid="ref20">20</xref>]. Consequently, these agencies aim to monitor but are unable to conduct real-time auditing of PIs in Canada. Therefore, there is a need to develop EMR data-specific algorithm for identifying PIs for monitoring and auditing within Canadian acute-care facilities. Our objective was to create EMR data-specific algorithms for HAPIs. Availability and implementation of PI-specific algorithms within a clinical information system would allow the abovementioned federal and provincial agencies to conduct real-time surveillance of HAPIs, improving patient safety, enhancing the quality of care, and reducing the burden of costs associated with adverse events. The EMR phenotype case detection is evaluated via comparison with confirmed HAPIs status acquired in a clinical trial [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>This is an EMR phenotyping study for enhancing HAPI identification using free-text notes. Obtained clinical trial data were linked to administrative and EMR data for model development and validation. The natural language processing (NLP) method’s performance was compared with results from the ICD validation study conducted in Alberta, Canada, by Wong et al [<xref ref-type="bibr" rid="ref21">21</xref>]. Detailed information for HAPIs identification can be found in their study.</p>
      </sec>
      <sec>
        <title>Clinical Trial Data</title>
        <p>Previously completed randomized controlled trial (RCT) data of 678 eligible consenting inpatients were obtained from an affiliated research team and were used as the reference standard [<xref ref-type="bibr" rid="ref21">21</xref>]. The trial evaluated the efficacy of a pressure-sensing mattress in preventing interface pressure. A research nurse performed a clinical head-to-toe skin assessment for PI formation, and suspected deep tissue injuries were monitored throughout 3 days of enrollment [<xref ref-type="bibr" rid="ref21">21</xref>]. Assessments were conducted within 24 hours of admission, on the day of trial enrollment, and the third day after enrollment, and documented in Allscripts Sunrise Clinical Manager (SCM) EMR (<xref rid="figure1" ref-type="fig">Figure 1</xref>). Three days were chosen as a length of time for the research nurse to perform data collection and risk assessment for 3 reasons. First, this is the average length of stay in the local inpatient units, and a longer trial period may include varying nursing practice due to hospital discharge with a shorter length of stay, unit changes, and more nursing shift changes. Second, the dedicated investigation team deemed 3 days sufficient for pressure-related skin and soft tissue changes to develop. Lastly, as a continuous collection of interface pressure throughout the enrollment period leads to a large volume of data, 3 days allowed for optimal data collection while maintaining participant enrollment.</p>
        <p>The research nurse, who measured pressure-related skin ulcerations, was trained as a wound care specialist in the provision of pressure ulcers, ostomy, and continence care [<xref ref-type="bibr" rid="ref21">21</xref>]. The patients’ PI status check on admission was determined based on when the patient was admitted. The clinical trial team relied on the medical record if the patient had been admitted long before the study and consented to the study. If the patient agreed to participate in the trial right after being admitted to the hospital, the research nurse noted the PI status on admission.</p>
        <p>The following data elements were abstracted from the clinical trial data: record ID, medical unit, sex, first-skin assessment date, second-skin assessment date, presence of PIs, and other possible related conditions (cerebrovascular disease, diabetes mellitus, etc). The clinical trial measured and classified PIs into 6 stages: stage 1, stage 2, stage 3, stage 4, suspected deep tissue injury, and unstageable PIs [<xref ref-type="bibr" rid="ref22">22</xref>]. Stages of PIs were identified according to the National Pressure Ulcer Advisory Panel’s pressure ulcer staging system [<xref ref-type="bibr" rid="ref23">23</xref>]. Stage 1 PIs include sores. Stage 2 captures open wounds on the surface of the skin. Stage 3 PIs represent wounds extending beneath the skin and affecting fat tissue. At stage 4, PIs are deep and reach into muscles, bones, and tendons. The trial is registered at clinicaltrials.gov (NCT02325388). Additional details surrounding the clinical trial data were published by Wong et al [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Illustration of the clinical trial for assessment of PI status in the enrolled patient cohort (n=678) and the data input used for the development of classification models. PI: pressure injury.</p>
          </caption>
          <graphic xlink:href="ai_v2i1e41264_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Study Cohort</title>
        <sec>
          <title>Inclusion and Exclusion Criteria</title>
          <p>During the RCT, eligible patients were at least 18 years old, were expected to have a length of stay of at least 3 days, and did not receive near-end-of-life care within 3 days of trial enrollment [<xref ref-type="bibr" rid="ref21">21</xref>]. Participants were recruited from nursing units with a high risk for PI development including acute medical, neurosurgery, neurology, and intensive care [<xref ref-type="bibr" rid="ref21">21</xref>]. For this study, patients were excluded if their data did not link to EMR data, had incomplete skin assessments, or included erroneous assessment or discharge dates. Patients with PIs on the day of admission were also excluded in order to track only PIs developed during hospitalization. Furthermore, intensive care unit (ICU) patients were excluded since their data were stored in another data warehouse with distinct data elements from those found in SCM and required restricted access. After careful selection, the final cohort of eligible patients was 280 (<xref rid="figure2" ref-type="fig">Figure 2</xref>).</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Flowchart of inclusion and exclusion criteria for the patient cohort based on trial completeness, PI status, and age (minimum age of 18 years old) for all controls in the panel. ICU: intensive care unit; PI: pressure injury; SCM: Sunrise Clinical Management.</p>
            </caption>
            <graphic xlink:href="ai_v2i1e41264_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>Data Linkage to Discharge Abstract Database and SCM EMR</title>
        <p>Deterministic data linkage was performed between the RCT data, administrative data from the discharge abstract database (DAD), and SCM EMR data [<xref ref-type="bibr" rid="ref24">24</xref>]. SCM was the EMR system employed in Calgary hospitals at the time of the study. Data linkage steps followed a previously established methodology [<xref ref-type="bibr" rid="ref25">25</xref>]. First, the PI RCT data were linked to the DAD using the provincial health number and admission date. Then, DAD variables were used to connect these data with SCM.</p>
      </sec>
      <sec>
        <title>Document Types and Sequential Forward Type Feature Selection</title>
        <p>In total, 37 types of documents were noted for the included patients during the clinical trial. Nursing notes were the primary source of suitable HAPI information and constituted the largest proportion of the documents. Among the nursing notes, “Patient Assessment” contained the assessment of skin and wounds under the Integument section. The Integument section described skin integrity, bruises, wound formation, and exposure to air. The “Patient Assessment Neuro” document included the patient's neurological state, where the main components related to PIs were level of consciousness, communication, and sensory deficit. The “Patient Care” document included patients' hygiene, activity, exercise, and nutrition, such as mobility, positioning, and assistance with a meal. The remaining document types contained daily intake and output, physiological indicators, pain scale, and other related data. Discharge summaries, unit transfer notes, and inpatient triage reports were not written for most patients during the clinical trial because the trial was primarily conducted in the middle of the hospital stay.</p>
        <p>Forward feature selection was used to determine the best combination of documents with 2 machine learning (ML) models: extreme gradient boosting (XGBoost) and random forest (RF) [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. Forward feature selection is an iterative way to obtain the best subset of features [<xref ref-type="bibr" rid="ref28">28</xref>]. The analyses began with no feature in the input of models. Then, in each iteration, new features were added and observed for improvements (<xref rid="figure3" ref-type="fig">Figure 3</xref>). The experiments were run with each feature from the list of all possible features, where the best predictor was then added to our feature set. This iteration ended when introducing a new feature did not significantly improve the targeted metric. In our experiments, the forward feature selection was performed for every document type. Instead of adding 1 feature in each iteration, all documents belonging to 1 type were added to the input of models. This feature selection stopped when adding a new document type did not increase the target metric. Due to the long convergence time, the forward feature selection was not conducted during the development of the deep learning model. Rather, the same optimal document set determined by ML models was used.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>A visual illustration of the sequential forward selection process for identifying feature subsets that maximize the performance of the ML pipeline. The candidate feature subsets were evaluated by using 5-fold cross-validation. For each subset of document types, 40 experiments were conducted with all possible combinations of 5 folds, 2 vectorizers, and 4 ML models. FPR: false positive rate. ML: machine learning; TF-IDF: term frequency-inverse document frequency; TPR: true positive rate.</p>
          </caption>
          <graphic xlink:href="ai_v2i1e41264_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Natural Language Processing</title>
        <sec>
          <title>Bag of Words Preprocessing and ML</title>
          <p>All nursing notes of selected document types were merged into 1 text and converted into a bag-of-words (BOW) vector with the count of words or term frequency-inverse document frequency (TF-IDF) vectorizer by using a Python scikit-learn ML library [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref31">31</xref>].</p>
          <p>A binary classification model was developed to identify HAPI cases by considering all patients who developed any stage of PI during a hospital stay as positive cases and patients without PIs as the negative cohort. The BOW matrices were used as the independent input for the models. RF and XGBoost classification models were trained to perform classification. These 2 models were chosen because they were representative of ensemble models: RF for bagging and XGboost for boosting. Ensemble models have been shown to display superior performance than a single classifier [<xref ref-type="bibr" rid="ref32">32</xref>]. Two sets of hyperparameters were tried for each model. The 5-fold cross-validation was conducted to determine the most useful document types, high-performing ML model, and its hyperparameters.</p>
        </sec>
        <sec>
          <title>Deep Learning Model</title>
          <p>A hierarchical attention network (HAN) structure with bidirectional encoder representations from transformers (BERT) was used to classify the text in the EMR clinical notes [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. BERT is a contextualized word representation model that uses a masked language model that predicts randomly masked words in a context sequence. Publicly released BERT parameters are trained on corpora such as Wikipedia, which is formatted differently from clinical text. As such, ClinicalBERT, a language model specifically pretrained using clinical notes, was used for the text evaluation [<xref ref-type="bibr" rid="ref35">35</xref>]. Medical language has been demonstrated to contain vast amounts of discipline-specific jargon, abbreviations, and acronyms while being a domain-specific and technical language [<xref ref-type="bibr" rid="ref36">36</xref>]. Multiple studies have demonstrated that ClinicalBERT performs better than BERT [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. Therefore, the decision to proceed with ClinicalBERT for our study was made. The ClinicalBERT embedding was not fine-tuned with clinical notes data due to a moderate sample size. Rather, the ClinicalBERT was downloaded and tested from a GitHub repo found in the study where Alzentzer et al observed performance improvements on three common clinical NLP tasks after training BERT models on clinical notes and discharge summaries [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. The document embedding layer weights were not taken from ClinicalBERT. As the maximum sequence length of BERT limits it from handling text with more than 512 tokens, sentence embeddings generated by ClinicalBERT are fed to another transformer to obtain the “document embedding,” a highly abstracted vector capturing global information about the whole document [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. HAPI status was classified based on this document embedding (<xref rid="figure4" ref-type="fig">Figure 4</xref>). The project-specific document embedding transformer was trained from the ground up through random initialization. Details of implementation and training of our HAN-BERT models are described in Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>].</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Composition of input sequence representations for text classification using BERT. The meaning of one sentence is summarized into the vector of [CLS] (classifier), an artifact token concatenated at the beginning of each sentence to become the sentence embedding. The sentence embedding is then fed to another transformer to generate the document embedding. An output layer with SoftMax activation provides the probability of text classification. BERT: bidirectional encoder representations from transformers.</p>
            </caption>
            <graphic xlink:href="ai_v2i1e41264_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>Model Evaluation</title>
        <p>We used 5-fold stratified cross-validation to split the 97 positive cases and 183 patient controls into 5 groups. Due to the fact both numbers were not divisible by 5, there was a minor difference in the distribution of cases and controls between groups, although the effort was placed to retain the most similar distribution between the 5 groups. Each time we selected 4 groups as a training set, the remaining group was used as a test set. The splitting was the same for ML and deep learning experiments. A comparison of different document type subsets was executed with the best model to determine which document type subset would yield the best performance of PI detection. To fairly compare our method with ICD-based PI identification algorithms, the classification threshold was tuned to achieve similarly estimated specificities (0.988 and 0.959) of 2 ICD-based algorithms developed and validated in a previous study by Ho et al [<xref ref-type="bibr" rid="ref1">1</xref>]. The first case definition is more specific and yields greater detection precision. The second definition is more inclusive of nonspecific codes for wounds and is likely to capture a larger number of cases. Sensitivity, specificity, positive predictive value (PPV), negative predictive value (NPV), and <italic>F</italic><sub>1</sub>-scores were calculated as target metrics. Additionally, PPV, NPV, sensitivity, and specificity of the 4 algorithms and 2 ICD algorithms were calculated with changing thresholds ranging from 0.05 to 0.95. <italic>F</italic><sub>1</sub>-score is a measure of accuracy through a combination of sensitivity and PPV. F1 has a maximum score of 1 when both sensitivity and PPV are 1, and a minimum of 0 when either sensitivity or PPV is 0. We calculated the binomial proportion CIs for sensitivity, specificity, PPV, and NPV using the Statsmodels package in Python (<ext-link ext-link-type="uri" xlink:href="https://en.wikipedia.org/wiki/Python_Software_Foundation" xlink:type="simple">Python Software Foundation</ext-link>) [<xref ref-type="bibr" rid="ref42">42</xref>]. The CIs of the <italic>F</italic><sub>1</sub>-score were from 5-fold cross-validation.</p>
      </sec>
      <sec>
        <title>Ethics Approval</title>
        <p>The study was approved by the Conjoint Health Research Ethics Board at the University of Calgary, Calgary, Alberta (REB13-0794).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Characteristics of Study Cohort</title>
        <p>The study included 280 eligible participants (<xref rid="figure2" ref-type="fig">Figure 2</xref>). Among the 280 patients, a research nurse identified 183 patients with no HAPIs, and 97 patients were found to have HAPIs. <xref ref-type="table" rid="table1">Table 1</xref> provides demographic details of the patient cohort. The <italic>P</italic> values were calculated with MedCalc’s statistical calculators [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]. The median age was 68 (IQR 55-79) years. The cohort consisted of 127 (45.36%) females, and the median length of stay was 46 (IQR-79) days. A more detailed review of input data and linguistic inquiry and word count analysis for the number of words, sentences, and patients based on document types can be found in Table S1 in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Descriptive statistics of patients (N=280).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="330"/>
            <col width="110"/>
            <col width="230"/>
            <col width="250"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td>Characteristics</td>
                <td>All</td>
                <td>Patients with pressure injury (n=97)</td>
                <td>Patients without pressure injury (n=183)</td>
                <td><italic>P</italic> value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Female, n (%)</td>
                <td>127 (45.36)</td>
                <td>42 (43.30)</td>
                <td>85 (46.45)</td>
                <td>.62</td>
              </tr>
              <tr valign="top">
                <td>Age (years), median (IQR)</td>
                <td>68 (55-79)</td>
                <td>68 (59-80)</td>
                <td>67 (53-79)</td>
                <td>.10</td>
              </tr>
              <tr valign="top">
                <td>Length of stay (days), median (IQR)</td>
                <td>46 (22-104)</td>
                <td>48 (28-96)</td>
                <td>46 (19-109)</td>
                <td>.37</td>
              </tr>
              <tr valign="top">
                <td>Cerebrovascular disease, n (%)</td>
                <td>137 (48.93)</td>
                <td>50 (51.55)</td>
                <td>87 (47.54)</td>
                <td>.52</td>
              </tr>
              <tr valign="top">
                <td>Chronic obstructive pulmonary disease, n (%)</td>
                <td>54 (19.29)</td>
                <td>26 (26.80)</td>
                <td>28 (15.30)</td>
                <td>.02</td>
              </tr>
              <tr valign="top">
                <td>Congestive heart failure, n (%)</td>
                <td>66 (23.57)</td>
                <td>30 (30.93)</td>
                <td>36 (19.67)</td>
                <td>.04</td>
              </tr>
              <tr valign="top">
                <td>Myocardial infarction, n (%)</td>
                <td>33 (11.79)</td>
                <td>9 (9.28)</td>
                <td>24 (13.11)</td>
                <td>.34</td>
              </tr>
              <tr valign="top">
                <td>Dementia, n (%)</td>
                <td>27 (9.64)</td>
                <td>10 (10.31)</td>
                <td>17 (9.29)</td>
                <td>.79</td>
              </tr>
              <tr valign="top">
                <td>Peripheral vascular disease, n (%)</td>
                <td>51 (18.21)</td>
                <td>21 (21.65)</td>
                <td>30 (16.39)</td>
                <td>.28</td>
              </tr>
              <tr valign="top">
                <td>Hemiplegia or paraplegia, n (%)</td>
                <td>119 (42.50)</td>
                <td>39 (40.21)</td>
                <td>80 (43.72)</td>
                <td>.57</td>
              </tr>
              <tr valign="top">
                <td>Leukemia, n (%)</td>
                <td>2 (0.71)</td>
                <td>1 (1.03)</td>
                <td>1 (0.55)</td>
                <td>.62</td>
              </tr>
              <tr valign="top">
                <td>Lymphoma, n (%)</td>
                <td>4 (1.43)</td>
                <td>2 (2.06)</td>
                <td>2 (1.09)</td>
                <td>.50</td>
              </tr>
              <tr valign="top">
                <td>Peptic ulcer disease, n (%)</td>
                <td>41 (14.64)</td>
                <td>21 (21.65)</td>
                <td>20 (10.93)</td>
                <td>.02</td>
              </tr>
              <tr valign="top">
                <td>Moderate or severe renal disease, n (%)</td>
                <td>55 (19.64)</td>
                <td>28 (28.87)</td>
                <td>27 (14.75)</td>
                <td>.005</td>
              </tr>
              <tr valign="top">
                <td>Liver disease, n (%)</td>
                <td>23 (8.21)</td>
                <td>8 (8.25)</td>
                <td>15 (8.20)</td>
                <td>.99</td>
              </tr>
              <tr valign="top">
                <td>Diabetes mellitus, n (%)</td>
                <td>91 (32.50)</td>
                <td>39 (40.21)</td>
                <td>52 (28.42)</td>
                <td>.045</td>
              </tr>
              <tr valign="top">
                <td>Solid tumor, n (%)</td>
                <td>50 (17.86)</td>
                <td>19 (19.59)</td>
                <td>31 (16.94)</td>
                <td>.58</td>
              </tr>
              <tr valign="top">
                <td>Connective tissue, n (%) disease</td>
                <td>51 (18.21)</td>
                <td>24 (24.74)</td>
                <td>27 (14.75)</td>
                <td>.04</td>
              </tr>
              <tr valign="top">
                <td>History of smoking, n (%)</td>
                <td>118 (42.14)</td>
                <td>45 (46.39)</td>
                <td>73 (39.89)</td>
                <td>.30</td>
              </tr>
              <tr valign="top">
                <td>Currently smoking, n (%)</td>
                <td>37 (13.21)</td>
                <td>11 (11.34)</td>
                <td>26 (14.21)</td>
                <td>.50</td>
              </tr>
              <tr valign="top">
                <td>History of illicit drug use, n (%)</td>
                <td>15 (5.36)</td>
                <td>7 (7.22)</td>
                <td>8 (4.37)</td>
                <td>.32</td>
              </tr>
              <tr valign="top">
                <td>Currently use illicit drugs, n (%)</td>
                <td>8 (2.86)</td>
                <td>3 (3.09)</td>
                <td>5 (2.73)</td>
                <td>.85</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Data Linkage and Extraction</title>
        <p><xref ref-type="table" rid="table2">Table 2</xref> shows the patient and document count and document word count for the patients eligible for this study. Most PI-positive patients had “Patient assessment” document type (60 (61.86%) patients with HAPI versus 82 (44.81%) patients without HAPI), and patients in the negative groups predominantly had “Patient assessment Neuro.” However, patients from both groups had a similar amount of “Patient care” during the trial (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Characteristics of extracted documents, different components of nursing notes, and the average number of documents written by nurses.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="340"/>
            <col width="190"/>
            <col width="200"/>
            <col width="240"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Document type</td>
                <td>All (N=280)</td>
                <td>Patients with HAPI (n=97)</td>
                <td>Patients without HAPI (n=183)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="5">
                  <bold>Patient assessment</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Number of patients with this type of document, n (%)</td>
                <td>142 (50.71)</td>
                <td>60 (61.86)</td>
                <td>82 (44.81)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Number of notes per patient, median (IQR)</td>
                <td>1.00 (0.00-17.00)</td>
                <td>12.00 (0.00-18.00)</td>
                <td>0.00 (0.00-16.00)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Word count per note, median (IQR)</td>
                <td>376.00 (306.00-430.00)</td>
                <td>385.00 (311.00-441.00)</td>
                <td>370.00 (303.00-421.00)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Patient assessment neuro</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Number of patients with this type of document, n (%)</td>
                <td>141 (50.36)</td>
                <td>39 (40.21)</td>
                <td>102 (55.74)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Number of notes per patient, median (IQR)</td>
                <td>2.50 (0.00-13.00)</td>
                <td>0.00 (0.00-13.00)</td>
                <td>8.00 (0.00-13.00)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Word count per note, median (IQR)</td>
                <td>428.00 (343.0-498.0)</td>
                <td>424.00 (324.00-493.50)</td>
                <td>430.00 (346.00-499.00)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Patient care</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Number of patients with this type of document, n (%)</td>
                <td>280 (100)</td>
                <td>97 (100)</td>
                <td>183(100)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Number of notes per patient, median (IQR)</td>
                <td>16.00 (13.00-21.20)</td>
                <td>16.00 (13.00-19.00)</td>
                <td>16.00 (13.00-23.50)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Word count per note, median (IQR)</td>
                <td>138.00 (72.00-179.00)</td>
                <td>147.00 (91.00-185.00)</td>
                <td>133.00 (66.00-176.00)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Document Subset and Classification Models</title>
        <p>Across a subset of document types and all tested classification techniques, the combination of Patient Assessment, Patient Assessment Neuro, and Patient Care yielded the highest outputs in terms of target metrics.</p>
        <p>The TF-IDF vectorizer with RF classifier demonstrated the best performance in terms of sensitivity, PPV, and NPV when fixed at the specificity of 0.988 and 0.959 thresholds. The performance results are reported in <xref ref-type="table" rid="table3">Table 3</xref>.</p>
        <p>For a specificity of 0.988, the sensitivity of the (TF-IDF+RF) EMR-based model was 0.464 (95% CI 0.365-0.563), which surpassed the sensitivity 0.277 (95% CI 0.174-0.380) achieved by the ICD-based algorithm [<xref ref-type="bibr" rid="ref1">1</xref>]. The PPV of our model had a mean of 0.938 (95% CI 0.869-1.000), which is higher than the reported 0.917 (95 % CI 0.854-0.980) of the ICD algorithm. The NPV was 0.776 (95% CI 0.722-0.830), which is also higher than the 0.739 (95% CI 0.638-0.840) reported in the ICD validation [<xref ref-type="bibr" rid="ref1">1</xref>]. For a specificity of 0.959 achieved by the loose ICD-based algorithm, the EMR model sensitivity reached 0.546 (95% CI 0.447-0.645) compared to 0.328 (95% CI 0.220-0.436) found in ICD reporting [<xref ref-type="bibr" rid="ref1">1</xref>]. Both PPV and NPV of EMR model were also higher (0.855 (95% CI 0.767-0.943) vs 0.793 (95% CI 0.700-0.886) and 0.798 (95% CI 0.745-0.851 vs 0.746 (95% CI 0.646-0.846) than those detected by ICD algorithm respectively. The deep learning model underperformed with the area under the receiver operating characteristic curve (AUC-ROC) score of 0.68 (SD 0.04), compared to the RF with the highest area under the curve (AUC) score of 0.80 (SD 0.08), followed by XGBoost with the AUC score of 0.75 (SD 0.07; <xref rid="figure5" ref-type="fig">Figure 5</xref>). Considering the prevalence of 34.6% in our study, the baseline area under the precision-recall curve (AU-PRC) is 0.346. <xref rid="figure6" ref-type="fig">Figure 6</xref> shows that an AU-PRC of 0.77 (SD 0.06) was achieved for the RF models using TF-IDF tokenization, 0.74 (SD 0.08) was achieved for the RF models using count tokenization, 0.67 (SD 0.04) was achieved for the XGBoost models, and 0.60 (SD 0.06) for the deep learning models. These results are greater than 0.346, and we conclude that these classifiers do not discriminate by random chance and perform well in finding positive HAPI cases without accidentally marking negative patients as positive. Figure S1 in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> shows the PPV, NPV, sensitivity, and specificity of the 4 algorithms and 2 ICD algorithms, with changing thresholds ranging between 0.05 and 0.95.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>The performance of NLP<sup>a</sup> methods on free-text electronic medical record documents at varying thresholds for the probability of pressure injury detection. The model was compared to ICD<sup>b</sup> algorithms such that the model was trained to mimic its specificity.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="200"/>
            <col width="150"/>
            <col width="150"/>
            <col width="160"/>
            <col width="160"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Model</td>
                <td>Sensitivity % <break/>(95% CI)</td>
                <td>Specificity % <break/>(95% CI)</td>
                <td>PPV<sup>c</sup> % <break/>(95% CI)</td>
                <td>NPV<sup>d</sup> % <break/>(95% CI)</td>
                <td><italic>F</italic><sub>1</sub>-score % <break/>(95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="7">
                  <bold>Specificity near 0.988</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>ICD (Ho et al [<xref ref-type="bibr" rid="ref1">1</xref>])</td>
                <td>0.277 (0.174-0.380)</td>
                <td>0.988 (0.963-1.013)</td>
                <td>0.917 (0.854-0.980)</td>
                <td>0.739 (0.638-0.840)</td>
                <td>0.425 (0.312-0.538)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TF-IDF<sup>e</sup>+random forest<sup>f</sup></td>
                <td>0.464 (0.365-0.563)</td>
                <td>0.984 (0.965-1.000)</td>
                <td>0.938 (0.869-1.000)</td>
                <td>0.776 (0.722-0.830)</td>
                <td>0.612 (0.473-0.751)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Count+random forest</td>
                <td>0.412 (0.314-0.510)</td>
                <td>0.978 (0.957-0.999)</td>
                <td>0.909 (0.824-0.994)</td>
                <td>0.758 (0.704-0.813)</td>
                <td>0.550 (0.361-0.739)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TF-IDF+XGBoost<sup>g</sup></td>
                <td>0.309 (0.217-0.401)</td>
                <td>0.973 (0.949-0.996)</td>
                <td>0.857 (0.741-0.973)</td>
                <td>0.727 (0.671-0.782)</td>
                <td>0.450 (0.340-0.559)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Word Embedding+BERT<sup>h</sup></td>
                <td>0.268 (0.180-0.356)</td>
                <td>0.978 (0.957-0.999)</td>
                <td>0.867 (0.745-0.988)</td>
                <td>0.716 (0.660-0.772)</td>
                <td>0.394 (0.207-0.580)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Specificity near 0.959</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>ICD (Ho et al [<xref ref-type="bibr" rid="ref1">1</xref>])</td>
                <td>0.328 (0.220-0.436)</td>
                <td>0.959 (0.913-0.100)</td>
                <td>0.793 (0.700-0.886)</td>
                <td>0.746 (0.646-0.846)</td>
                <td>0.464 (0.350-0.578)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TF-IDF+random forest</td>
                <td>0.546 (0.447-0.645)</td>
                <td>0.951 (0.919-0.982)</td>
                <td>0.855 (0.767-0.943)</td>
                <td>0.798 (0.745-0.851)</td>
                <td>0.665 (0.577-0.753)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Count+random forest</td>
                <td>0.423 (0.324-0.521)</td>
                <td>0.956 (0.927 -0.986)</td>
                <td>0.837 (0.733-0.940)</td>
                <td>0.758 (0.702-0.813)</td>
                <td>0.546 (0.359-0.733)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TF-IDF+XGBoost</td>
                <td>0.423 (0.324-0.521)</td>
                <td>0.956 (0.927-0.986)</td>
                <td>0.837 (0.733-0.940)</td>
                <td>0.758 (0.702-0.813)</td>
                <td>0.552 (0.404-0.699)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Word embedding+BERT</td>
                <td>0.289 (0.198-0.379)</td>
                <td>0.967 (0.941-0.993)</td>
                <td>0.824 (0.695-0.952)</td>
                <td>0.720 (0.663-0.776)</td>
                <td>0.420 (0.280-0.560)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>NLP: natural language processing.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>ICD: International Classification of Diseases.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>PPV: positive predictive value.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>NPV: negative predictive value.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>TF-IDF: term frequency-inverse document frequency.</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>f</sup>The best model<italic>.</italic></p>
            </fn>
            <fn id="table3fn7">
              <p><sup>g</sup>XGBoost: extreme gradient boosting.</p>
            </fn>
            <fn id="table3fn8">
              <p><sup>h</sup>BERT: bidirectional encoder representations from transformers.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>The ROC curves derived from the random forest with TF-IDF and word count, XGBoost, and deep learning models. AUC: area under the curve; ROC: receiver operating characteristic; TF-IDF: term frequency-inverse document frequency; XGBoost: eXtreme gradient boosting. </p>
          </caption>
          <graphic xlink:href="ai_v2i1e41264_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>The area under the precision-recall curve (AU-PRC) performance of 4 models: random forest with TF-IDF and word count, XGBoost, deep learning model. AUC: area under the curve; PRC: precision-recall curve; TF-IDF: term frequency-inverse document frequency; XGBoost: eXtreme gradient boosting; </p>
          </caption>
          <graphic xlink:href="ai_v2i1e41264_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Multiple methods were applied, and different combinations of clinical text were analyzed to determine the efficiency of NLP models in detecting HAPIs from nursing notes. The results of NLP models were compared with the ICD-based algorithm reported in the previous study [<xref ref-type="bibr" rid="ref1">1</xref>]. An AUC of 0.80 (SD 0.07) of the ML model indicates fair accuracy in terms of produced sensitivity and specificity. The results demonstrate that different combinations of EMR data leverage NLP models to improve upon ICD-10–based HAPI case definitions. The TF-IDF with RF produced higher sensitivity at a strict specificity level. The satisfactory performance of ML models indicates that the free-text documented during hospitalization contains valuable information for HAPI detection. Developing algorithms using EMR data will facilitate the timely and accurate capture of HAPI incidences and measure the quality of nursing practice during patient hospitalization.</p>
        <p>From the forward document type selection, we found that apart from the notes that directly document skin conditions in the patient assessment, the entries noting the patient’s consciousness, nutrition, and mobility were helpful in indicating HAPI. This makes clinical sense because the reduced level of consciousness, nutrition, and mobility are factors that may contribute to HAPI [<xref ref-type="bibr" rid="ref45">45</xref>]. In addition, our findings align with several risk factors of the Braden Scale [<xref ref-type="bibr" rid="ref46">46</xref>]. Given that many factors of the Braden Scale are documented in nursing notes daily, it may be promising to use NLP to automatically extract the Braden Scale’s factors and achieve better PI detection or prediction upon the automatically rated Braden Scale [<xref ref-type="bibr" rid="ref46">46</xref>].</p>
        <p>The results showed that the XGBoost and RF methods perform better than the advanced deep learning models by a large margin. The joint effort of the TF-IDF vectorizer and tree-based classifier enabled the pipeline to stay robust to irrelevant vocabularies, even when the sample size was smaller than the feature size. The feature selection played a role in this task because a great part of the text in clinical documents was not relevant to HAPIs and only contributed noise for the classification task. On the other hand, deep learning models allowed every input word to contribute to the document embedding upon which the model judged the presence of HAPIs. The suboptimal performance of the deep learning model may have been avoided if the transformers' attention mechanisms had more training samples to converge. The noisy data and not a very large sample size were possibly the main factors that made the deep learning models perform poorly. However, this hypothesis needs further examination.</p>
        <p>Compared to these previous studies that used EMR to automate phenotyping, our model achieved higher sensitivity while reporting comparable values for performance metrics such as PPV and NPV. Furthermore, our model can identify HAPIs with high specificity and improved sensitivity during the first three days in routine clinical practice settings. Melton et al [<xref ref-type="bibr" rid="ref47">47</xref>] found NLP to be reliable and effective in detecting 16 out of 65 adverse events in 1000 manually reviewed charts. The model by Melton et al [<xref ref-type="bibr" rid="ref47">47</xref>] then processed all inpatient cases with EMR discharge summaries, achieving high specificity (0.9996) and low sensitivity (0.28). Our model results are in line with other studies that used free-text clinical notes to predict incidences of distinct adverse events [<xref ref-type="bibr" rid="ref48">48</xref>-<xref ref-type="bibr" rid="ref51">51</xref>].</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The study is not without limitations. First, the exclusion of ICU patients due to data elements being distinct from SCM led to a smaller sample size and a narrower clinical cohort. Nevertheless, the remaining data from the clinical trial represented a population at risk for HAPIs. Second, both the patient and nurse knew at the admission of a clinical trial measuring PI would be the trial goal, which may have impacted the data entry quality of PI and frequency of patients to report PI-related discomfort. Third, the model produced relatively modest sensitivity. However, this sensitivity is deemed valuable, given that the specificity was set to a high threshold, and the input was restricted to the first 72 hours after enrollment [<xref ref-type="bibr" rid="ref16">16</xref>]. The sensitivity reported in similar studies used the whole or more extended hospitalization stay and more data elements [<xref ref-type="bibr" rid="ref50">50</xref>-<xref ref-type="bibr" rid="ref52">52</xref>]. In addition, the sensitivity of our study was obtained through a comparison to a clinical trial instead of chart review data. Chart review does not always capture all positive cases due to possible errors in the review process [<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref54">54</xref>]. Fourth, the comparison with deep learning is not likely to be very fair because BERT-based models are usually applied to larger cohorts. Nevertheless, our result can be served as a reference for model selection for researchers working with similar sample sizes. Prabhakar et al applied ClinicalBERT to phenotype 10 diseases on a cohort consisting of 1610 discharge summaries [<xref ref-type="bibr" rid="ref41">41</xref>]. When only using ClinicalBERT, they obtained a very similar <italic>F</italic><sub>1</sub>-score (0.46) compared to our result [<xref ref-type="bibr" rid="ref41">41</xref>]. The suboptimal performances of the advanced deep learning model may suggest that study needs to be more evolved before applying deep learning to free-text-based clinical phenotyping. Tree-based ML models are recommended for detecting adverse event conditions from noisy, moderately sized text samples.</p>
      </sec>
      <sec>
        <title>Future Directions</title>
        <p>The present work focused on demonstrating ML models on cross-sectional EMR data can outperform the ICD-based PI identification algorithm. Future directions could include (1) leveraging cost-sensitive learning to assign various weights to assess the impact of misclassifying the patients with a PI, (2) identification of the potential risk features or predictors that may be associated with PI, (3) comparison of HAN-BERT against other novel NN structures, and (4) detailed ablation studies for assessing the performance of components on the designed models that will hopefully be integrated into a clinical decision-support system. These studies will require larger sample sizes than our current pilot study, but our current work can be used to create such a cohort.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Our study revealed the feasibility of using inpatient clinical notes documented for 3 days to detect HAPIs with increased accuracy over ICD methods. NLP and ML application on inpatient clinical notes allowed better and more timely use of the clinical narratives compared to summarizing them into ICD codes and DAD, thereby being a promising solution for precise, time-sensitive, population-based disease phenotyping. With the advent of digital technologies in health care, the results contribute toward an automated approach to better cohort identification, patient surveillance, and quality improvement for the treatment of hospital-acquired adverse events. The application of the model is particularly relevant for effectively mining clinical data that does not capture a large sample size for adverse effects phenotyping. The proposed method of identifying patients in acute care hospitals who are likely to have or develop PI will most likely be used by front-line hospital staff to prevent or manage PI earlier and more effectively.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Implementation details.</p>
        <media xlink:href="ai_v2i1e41264_app1.docx" xlink:title="DOCX File , 84 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Linguistic inquiry and word count analysis.</p>
        <media xlink:href="ai_v2i1e41264_app2.docx" xlink:title="DOCX File , 16 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Positive predictive value (PPV), negative predictive value (NPV), sensitivity, and specificity of the four algorithms and two International Classification of Diseases (ICD) algorithms, with changing thresholds ranging between 0.05 and 0.95.</p>
        <media xlink:href="ai_v2i1e41264_app3.docx" xlink:title="DOCX File , 103 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC</term>
          <def>
            <p>area under the curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUC-ROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AU-PRC</term>
          <def>
            <p>area under the precision-recall curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">BERT</term>
          <def>
            <p>bidirectional encoder representations from transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">BOW</term>
          <def>
            <p>bag-of-words</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">DAD</term>
          <def>
            <p>discharge abstract database</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">EMR</term>
          <def>
            <p>electronic medical record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">HAN</term>
          <def>
            <p>hierarchical attention network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">HAPIs</term>
          <def>
            <p>hospital-acquired pressure injuries</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ICD</term>
          <def>
            <p>International Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">ICU</term>
          <def>
            <p>intensive care unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">NPV</term>
          <def>
            <p>negative predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">PI</term>
          <def>
            <p>pressure injury</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">PPV</term>
          <def>
            <p>positive predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">RCT</term>
          <def>
            <p>randomized controlled trial</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">RF</term>
          <def>
            <p>random forest</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">SCM</term>
          <def>
            <p>Sunrise Clinical Manager</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb20">TF-IDF</term>
          <def>
            <p>term frequency-inverse document frequency</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb21">XGBoost</term>
          <def>
            <p>extreme gradient boosting</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Eastwood</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Weaver</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Quan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Validation of two case definitions to identify pressure ulcers using hospital administrative data</article-title>
          <source>BMJ Open</source>
          <year>2017</year>
          <month>08</month>
          <day>28</day>
          <volume>7</volume>
          <issue>8</issue>
          <fpage>e016438</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=28851785"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2017-016438</pub-id>
          <pub-id pub-id-type="medline">28851785</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2017-016438</pub-id>
          <pub-id pub-id-type="pmcid">PMC5629722</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Woodbury</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Houghton</surname>
              <given-names>PE</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of pressure ulcers in Canadian healthcare settings</article-title>
          <source>Ostomy Wound Manage</source>
          <year>2004</year>
          <month>10</month>
          <volume>50</volume>
          <issue>10</issue>
          <fpage>22</fpage>
          <lpage>24, 26, 28, 30, 32, 34, 36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.o-wm.com/content/prevalence-pressure-ulcers-canadian-healthcare-settings"/>
          </comment>
          <pub-id pub-id-type="medline">15509880</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lyder</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Metersky</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Curry</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kliman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Verzier</surname>
              <given-names>NR</given-names>
            </name>
            <name name-style="western">
              <surname>Hunt</surname>
              <given-names>DR</given-names>
            </name>
          </person-group>
          <article-title>Hospital-acquired pressure ulcers: results from the national Medicare Patient Safety Monitoring System study</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2012</year>
          <month>09</month>
          <volume>60</volume>
          <issue>9</issue>
          <fpage>1603</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1532-5415.2012.04106.x</pub-id>
          <pub-id pub-id-type="medline">22985136</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ebi</surname>
              <given-names>WE</given-names>
            </name>
            <name name-style="western">
              <surname>Hirko</surname>
              <given-names>GF</given-names>
            </name>
            <name name-style="western">
              <surname>Mijena</surname>
              <given-names>DA</given-names>
            </name>
          </person-group>
          <article-title>Nurses' knowledge to pressure ulcer prevention in public hospitals in Wollega: a cross-sectional study design</article-title>
          <source>BMC Nurs</source>
          <year>2019</year>
          <volume>18</volume>
          <fpage>20</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcnurs.biomedcentral.com/articles/10.1186/s12912-019-0346-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12912-019-0346-y</pub-id>
          <pub-id pub-id-type="medline">31139012</pub-id>
          <pub-id pub-id-type="pii">346</pub-id>
          <pub-id pub-id-type="pmcid">PMC6528293</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baharestani</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Black</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Carville</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cuddigan</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Dealey</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Defloor</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Harding</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Lahmann</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Lubbers</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lyder</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Ohura</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Orsted</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Reger</surname>
              <given-names>SI</given-names>
            </name>
            <name name-style="western">
              <surname>Romanelli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sanada</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Dilemmas in measuring and using pressure ulcer prevalence and incidence: an international consensus</article-title>
          <source>Int Wound J</source>
          <year>2009</year>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>97</fpage>
          <lpage>104</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/19432659"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1742-481X.2009.00593.x</pub-id>
          <pub-id pub-id-type="medline">19432659</pub-id>
          <pub-id pub-id-type="pii">IWJ593</pub-id>
          <pub-id pub-id-type="pmcid">PMC7951416</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Malley</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>KF</given-names>
            </name>
            <name name-style="western">
              <surname>Price</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Wildes</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Hurdle</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Ashton</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Measuring diagnoses: ICD code accuracy</article-title>
          <source>Health Serv Res</source>
          <year>2005</year>
          <volume>40</volume>
          <issue>5 Pt 2</issue>
          <fpage>1620</fpage>
          <lpage>1639</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16178999"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1475-6773.2005.00444.x</pub-id>
          <pub-id pub-id-type="medline">16178999</pub-id>
          <pub-id pub-id-type="pii">HESR444</pub-id>
          <pub-id pub-id-type="pmcid">PMC1361216</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dutta</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>HG</given-names>
            </name>
          </person-group>
          <article-title>The adoption of electronic medical record by physicians: a PRISMA-compliant systematic review</article-title>
          <source>Medicine (Baltimore)</source>
          <year>2020</year>
          <volume>99</volume>
          <issue>8</issue>
          <fpage>e19290</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1097/MD.0000000000019290"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MD.0000000000019290</pub-id>
          <pub-id pub-id-type="medline">32080145</pub-id>
          <pub-id pub-id-type="pii">00005792-202002210-00075</pub-id>
          <pub-id pub-id-type="pmcid">PMC7034652</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>D'souza</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Doktorchik</surname>
              <given-names>CTA</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Eastwood</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Fine</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hemmelgarn</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Todd</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Quan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Enhancing ICD-code-based case definition for heart failure using electronic medical record data</article-title>
          <source>J Card Fail</source>
          <year>2020</year>
          <volume>26</volume>
          <issue>7</issue>
          <fpage>610</fpage>
          <lpage>617</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cardfail.2020.04.003</pub-id>
          <pub-id pub-id-type="medline">32304875</pub-id>
          <pub-id pub-id-type="pii">S1071-9164(20)30030-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ford</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>HE</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cassell</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Extracting information from the text of electronic medical records to improve case detection: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2016</year>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>1007</fpage>
          <lpage>1015</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26911811"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocv180</pub-id>
          <pub-id pub-id-type="medline">26911811</pub-id>
          <pub-id pub-id-type="pii">ocv180</pub-id>
          <pub-id pub-id-type="pmcid">PMC4997034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Chiang</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Hribar</surname>
              <given-names>MR</given-names>
            </name>
          </person-group>
          <article-title>Applications of artificial intelligence to electronic health record data in ophthalmology</article-title>
          <source>Transl Vis Sci Technol</source>
          <year>2020</year>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>13</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32704419"/>
          </comment>
          <pub-id pub-id-type="doi">10.1167/tvst.9.2.13</pub-id>
          <pub-id pub-id-type="medline">32704419</pub-id>
          <pub-id pub-id-type="pii">TVST-19-1997</pub-id>
          <pub-id pub-id-type="pmcid">PMC7347028</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bao</surname>
              <given-names>XY</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Niu</surname>
              <given-names>CZ</given-names>
            </name>
          </person-group>
          <article-title>[A customized method for information extraction from unstructured text data in the electronic medical records]</article-title>
          <source>Beijing Da Xue Xue Bao Yi Xue Ban</source>
          <year>2018</year>
          <volume>50</volume>
          <issue>2</issue>
          <fpage>256</fpage>
          <lpage>263</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://xuebao.bjmu.edu.cn/EN/Y2018/V50/I2/256"/>
          </comment>
          <pub-id pub-id-type="doi">10.3969/j.issn.1671-167X.2018.02.010</pub-id>
          <pub-id pub-id-type="medline">29643524</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Juhn</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence approaches using natural language processing to advance EHR-based clinical research</article-title>
          <source>J Allergy Clin Immunol</source>
          <year>2020</year>
          <volume>145</volume>
          <issue>2</issue>
          <fpage>463</fpage>
          <lpage>469</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31883846"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jaci.2019.12.897</pub-id>
          <pub-id pub-id-type="medline">31883846</pub-id>
          <pub-id pub-id-type="pii">S0091-6749(19)32604-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7771189</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Szlosek</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrett</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using machine learning and natural language processing algorithms to automate the evaluation of clinical decision support in electronic medical record systems</article-title>
          <source>EGEMS (Wash DC)</source>
          <year>2016</year>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>1222</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27683664"/>
          </comment>
          <pub-id pub-id-type="doi">10.13063/2327-9214.1222</pub-id>
          <pub-id pub-id-type="medline">27683664</pub-id>
          <pub-id pub-id-type="pii">egems1222</pub-id>
          <pub-id pub-id-type="pmcid">PMC5019306</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maarseveen</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Meinderink</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Reinders</surname>
              <given-names>MJT</given-names>
            </name>
            <name name-style="western">
              <surname>Knitza</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huizinga</surname>
              <given-names>TWJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kleyer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>van den Akker</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Knevel</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Machine learning electronic health record identification of patients with rheumatoid arthritis: algorithm pipeline development and validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>11</issue>
          <fpage>e23930</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2020/11/e23930/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/23930</pub-id>
          <pub-id pub-id-type="medline">33252349</pub-id>
          <pub-id pub-id-type="pii">v8i11e23930</pub-id>
          <pub-id pub-id-type="pmcid">PMC7735897</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Horwitz</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Toh</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Using machine learning to identify health outcomes from electronic health record data</article-title>
          <source>Curr Epidemiol Rep</source>
          <year>2018</year>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>331</fpage>
          <lpage>342</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30555773"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40471-018-0165-9</pub-id>
          <pub-id pub-id-type="medline">30555773</pub-id>
          <pub-id pub-id-type="pmcid">PMC6289196</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>NB</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Mani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Extracting and integrating data from entire electronic health records for detecting colorectal cancer cases</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2011</year>
          <volume>2011</volume>
          <fpage>1564</fpage>
          <lpage>1572</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22195222"/>
          </comment>
          <pub-id pub-id-type="medline">22195222</pub-id>
          <pub-id pub-id-type="pmcid">PMC3243156</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <article-title>Canada's health care system</article-title>
          <source>Government of Canada</source>
          <year>2019</year>
          <access-date>2022-12-16</access-date>
          <publisher-loc>Canada</publisher-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.canada.ca/en/health-canada/services/health-care-system/reports-publications/health-care-system/canada.html">https://www.canada.ca/en/health-canada/services/health-care-system/reports-publications/health-care-system/canada.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lawand</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Perry</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>Compromised wounds in Canada</article-title>
          <source>Healthc Q</source>
          <year>2014</year>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>7</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.12927/hcq.2014.23787</pub-id>
          <pub-id pub-id-type="medline">24844713</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <article-title>About CIHI</article-title>
          <source>Canadian Institute for Health Information</source>
          <access-date>2023-01-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cihi.ca/en/about-cihi">https://www.cihi.ca/en/about-cihi</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <article-title>Discharge abstract database metadata (DAD)</article-title>
          <source>Canadian Institute for Health Information</source>
          <access-date>2023-01-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cihi.ca/en/discharge-abstract-database-metadata-dad">https://www.cihi.ca/en/discharge-abstract-database-metadata-dad</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kaufman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Baylis</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Conly</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Hogan</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Stelfox</surname>
              <given-names>HT</given-names>
            </name>
            <name name-style="western">
              <surname>Southern</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Ghali</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>CH</given-names>
            </name>
          </person-group>
          <article-title>Efficacy of a pressure-sensing mattress cover system for reducing interface pressure: study protocol for a randomized controlled trial</article-title>
          <source>Trials</source>
          <year>2015</year>
          <month>09</month>
          <day>29</day>
          <volume>16</volume>
          <fpage>434</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://trialsjournal.biomedcentral.com/articles/10.1186/s13063-015-0949-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13063-015-0949-x</pub-id>
          <pub-id pub-id-type="medline">26420303</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13063-015-0949-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC4588270</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Edsberg</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Black</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McNichol</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sieggreen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Revised National Pressure Ulcer Advisory Panel pressure injury staging system: revised pressure injury staging system</article-title>
          <source>J Wound Ostomy Continence Nurs</source>
          <year>2016</year>
          <volume>43</volume>
          <issue>6</issue>
          <fpage>585</fpage>
          <lpage>597</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27749790"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/WON.0000000000000281</pub-id>
          <pub-id pub-id-type="medline">27749790</pub-id>
          <pub-id pub-id-type="pmcid">PMC5098472</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Black</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Baharestani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cuddigan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dorner</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Edsberg</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Langemo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Posthauer</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Ratliff</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Taler</surname>
              <given-names>G</given-names>
            </name>
            <collab>National Pressure Ulcer Advisory Panel</collab>
          </person-group>
          <article-title>National Pressure Ulcer Advisory Panel's updated pressure ulcer staging system</article-title>
          <source>Dermatol Nurs</source>
          <year>2007</year>
          <month>08</month>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>343</fpage>
          <lpage>349; quiz 350</lpage>
          <pub-id pub-id-type="medline">17874603</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>D Apos Souza</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Doktorchik</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Quan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Unlocking the potential of electronic health records for health research</article-title>
          <source>Int J Popul Data Sci</source>
          <year>2020</year>
          <month>01</month>
          <day>30</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>1123</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32935049"/>
          </comment>
          <pub-id pub-id-type="doi">10.23889/ijpds.v5i1.1123</pub-id>
          <pub-id pub-id-type="medline">32935049</pub-id>
          <pub-id pub-id-type="pii">5:02</pub-id>
          <pub-id pub-id-type="pmcid">PMC7473254</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>D'Souza</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Doktorchik</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Southern</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wiebe</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Quan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Eastwood</surname>
              <given-names>CA</given-names>
            </name>
          </person-group>
          <article-title>CREATE: a new data resource to support cardiac precision health</article-title>
          <source>CJC Open</source>
          <year>2021</year>
          <month>05</month>
          <volume>3</volume>
          <issue>5</issue>
          <fpage>639</fpage>
          <lpage>645</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2589-790X(20)30239-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cjco.2020.12.019</pub-id>
          <pub-id pub-id-type="medline">34036259</pub-id>
          <pub-id pub-id-type="pii">S2589-790X(20)30239-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC8134941</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>XGBoost: a scalable tree boosting system</article-title>
          <year>2016</year>
          <conf-name>KDD '16: The 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>August 13-17 , 2016</conf-date>
          <conf-loc>San Francisco, California</conf-loc>
          <publisher-loc>New York, NY, USA</publisher-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <fpage>785</fpage>
          <lpage>794</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/2939672.2939785"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>TK</given-names>
            </name>
          </person-group>
          <article-title>Random decision forests</article-title>
          <year>1995</year>
          <conf-name>Proceedings of 3rd International Conference on Document Analysis and Recognition</conf-name>
          <conf-date>August 14-16, 1995</conf-date>
          <conf-loc>Montreal, QC, Canada</conf-loc>
          <fpage>278</fpage>
          <lpage>282</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ieeexplore.ieee.org/document/598994"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/icdar.1995.598994</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Last</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kandel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Maimon</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Information-theoretic algorithm for feature selection</article-title>
          <source>Pattern Recogn Lett</source>
          <year>2001</year>
          <month>5</month>
          <volume>22</volume>
          <issue>6-7</issue>
          <fpage>799</fpage>
          <lpage>811</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/abs/pii/S0167865501000198?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/s0167-8655(01)00019-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>ZS</given-names>
            </name>
          </person-group>
          <article-title>Distributional structure</article-title>
          <source>WORD</source>
          <year>2015</year>
          <month>12</month>
          <day>04</day>
          <volume>10</volume>
          <issue>2-3</issue>
          <fpage>146</fpage>
          <lpage>162</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/chapter/10.1007/978-94-009-8467-7_1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/00437956.1954.11659520</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Sammut</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Webb</surname>
              <given-names>GI</given-names>
            </name>
          </person-group>
          <source>Encyclopedia of Machine Learning</source>
          <year>2010</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <pub-id pub-id-type="doi">10.1007/978-0-387-30164-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
          <article-title>Scikit-learn: machine learning in python</article-title>
          <source>Scikit-learn</source>
          <access-date>2023-01-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://scikit-learn.org/stable/">https://scikit-learn.org/stable/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sagi</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Rokach</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Ensemble learning: a survey</article-title>
          <source>Wiley Interdisciplinary Reviews-Data Mining and Knowledge Discovery</source>
          <year>2018</year>
          <volume>8</volume>
          <issue>4</issue>
          <fpage>e1249</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://wires.onlinelibrary.wiley.com/doi/abs/10.1002/widm.1249"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/widm.1249</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Dyer</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Smola</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hovy</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Hierarchical attention networks for document classification</article-title>
          <year>2016</year>
          <conf-name>Proceedings of the 2016 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</conf-name>
          <conf-date>June 2016</conf-date>
          <conf-loc>San Diego, California</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>1480</fpage>
          <lpage>1489</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/N16-1174/"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/n16-1174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>arXiv. Preprint posted online October 11, 2018</source>
          <year>2018</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1810.04805"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Altosaar</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ranganath</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>ClinicalBERT: modeling clinical notes and predicting hospital readmission</article-title>
          <source>arXiv. Preprint posted online April 10, 2019</source>
          <year>2019</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1904.05342"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hull</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Medical language proficiency: A discussion of interprofessional language competencies and potential for patient risk</article-title>
          <source>Int J Nurs Stud</source>
          <year>2016</year>
          <month>02</month>
          <volume>54</volume>
          <fpage>158</fpage>
          <lpage>172</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijnurstu.2015.02.015</pub-id>
          <pub-id pub-id-type="medline">25863658</pub-id>
          <pub-id pub-id-type="pii">S0020-7489(15)00061-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bethard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dligach</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sadeque</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>TA</given-names>
            </name>
          </person-group>
          <article-title>Does BERT need domain adaptation for clinical negation detection?</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>04</month>
          <day>01</day>
          <volume>27</volume>
          <issue>4</issue>
          <fpage>584</fpage>
          <lpage>591</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32044989"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaa001</pub-id>
          <pub-id pub-id-type="medline">32044989</pub-id>
          <pub-id pub-id-type="pii">5733888</pub-id>
          <pub-id pub-id-type="pmcid">PMC7075528</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alsentzer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Boag</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Jindi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>McDermott</surname>
              <given-names>MBA</given-names>
            </name>
          </person-group>
          <article-title>Publicly available clinical BERT embeddings</article-title>
          <source>arXiv. Preprint posted online April 6, 2019</source>
          <year>2019</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1904.03323"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/w19-1909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alsentzer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Boag</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Jindi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>McDermott</surname>
              <given-names>MBA</given-names>
            </name>
          </person-group>
          <article-title>Publicly available clinical BERT embeddings</article-title>
          <year>2019</year>
          <conf-name>Proceedings of the 2nd Clinical Natural Language Processing Workshop</conf-name>
          <conf-date>June 2019</conf-date>
          <conf-loc>Minneapolis, Minnesota, USA</conf-loc>
          <fpage>72</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/W19-1909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>NF</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Belinkov</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Linguistic Knowledge and Transferability of Contextual Representations</article-title>
          <year>2019</year>
          <conf-name>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers)</conf-name>
          <conf-date>June 2019</conf-date>
          <conf-loc>Minneapolis, Minnesota, USA</conf-loc>
          <fpage>1073</fpage>
          <lpage>1094</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/N19-1112</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prabhakar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shidharth</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kamath</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Neural language modeling of unstructured clinical notes for automated patient phenotyping</article-title>
          <source>2022 56th Annual Conference on Information Sciences and Systems (CISS)</source>
          <year>2022</year>
          <conf-name>2022 56th Annual Conference on Information Sciences and Systems (CISS)</conf-name>
          <conf-date>9-11 March 2022</conf-date>
          <conf-loc>Princeton, NJ, USA</conf-loc>
          <fpage>142</fpage>
          <lpage>147</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ieeexplore.ieee.org/document/9751198"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Seabold</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Perktold</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Statsmodels: econometric and statistical modeling with python</article-title>
          <year>2010</year>
          <conf-name>Proceedings of the 9th Python in Science Conference</conf-name>
          <conf-date>June 28-30, 2010</conf-date>
          <conf-loc>Austin</conf-loc>
          <fpage>92</fpage>
          <lpage>96</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://conference.scipy.org/proceedings/scipy2010/seabold.html"/>
          </comment>
          <pub-id pub-id-type="doi">10.25080/majora-92bf1922-011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <article-title>Comparison of proportions calculator</article-title>
          <source>MedCalc</source>
          <access-date>2023-01-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.medcalc.org/calc/comparison_of_proportions.php">https://www.medcalc.org/calc/comparison_of_proportions.php</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <article-title>Comparison of means calculator</article-title>
          <source>MedCalc</source>
          <access-date>2023-01-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.medcalc.org/calc/comparison_of_means.php">https://www.medcalc.org/calc/comparison_of_means.php</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Raetz</surname>
              <given-names>JGM</given-names>
            </name>
            <name name-style="western">
              <surname>Wick</surname>
              <given-names>KH</given-names>
            </name>
          </person-group>
          <article-title>Common questions about pressure ulcers</article-title>
          <source>Am Fam Phys</source>
          <year>2015</year>
          <month>11</month>
          <day>15</day>
          <volume>92</volume>
          <issue>10</issue>
          <fpage>888</fpage>
          <lpage>894</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aafp.org/link_out?pmid=26554282"/>
          </comment>
          <pub-id pub-id-type="medline">26554282</pub-id>
          <pub-id pub-id-type="pii">d12200</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Braden</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bergstrom</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>A conceptual schema for the study of the etiology of pressure sores</article-title>
          <source>Rehabil Nurs</source>
          <year>1987</year>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>8</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1002/j.2048-7940.1987.tb00541.x</pub-id>
          <pub-id pub-id-type="medline">3643620</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Melton</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Automated detection of adverse events using natural language processing of discharge summaries</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2005</year>
          <volume>12</volume>
          <issue>4</issue>
          <fpage>448</fpage>
          <lpage>457</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/15802475"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M1794</pub-id>
          <pub-id pub-id-type="medline">15802475</pub-id>
          <pub-id pub-id-type="pii">M1794</pub-id>
          <pub-id pub-id-type="pmcid">PMC1174890</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sotoodeh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gero</surname>
              <given-names>ZH</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Hertzberg</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Pressure ulcer injury in unstructured clinical notes: detection and interpretation</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2020</year>
          <volume>2020</volume>
          <fpage>1160</fpage>
          <lpage>1169</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33936492"/>
          </comment>
          <pub-id pub-id-type="medline">33936492</pub-id>
          <pub-id pub-id-type="pii">152_3415683</pub-id>
          <pub-id pub-id-type="pmcid">PMC8075497</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lima</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Freed</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>O'Malley</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Emeny</surname>
              <given-names>RT</given-names>
            </name>
          </person-group>
          <article-title>Machine learning approaches for hospital acquired pressure injuries: a retrospective study of electronic medical records</article-title>
          <source>Front Med Technol</source>
          <year>2022</year>
          <volume>4</volume>
          <fpage>926667</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35782577"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fmedt.2022.926667</pub-id>
          <pub-id pub-id-type="medline">35782577</pub-id>
          <pub-id pub-id-type="pmcid">PMC9243224</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Na</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jun</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kweon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hur</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chae</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Electronic medical record-based machine learning approach to predict the risk of 30-day adverse cardiac events after invasive coronary treatment: machine learning model development and validation</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>05</month>
          <day>11</day>
          <volume>10</volume>
          <issue>5</issue>
          <fpage>e26801</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/5/e26801/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26801</pub-id>
          <pub-id pub-id-type="medline">35544292</pub-id>
          <pub-id pub-id-type="pii">v10i5e26801</pub-id>
          <pub-id pub-id-type="pmcid">PMC9133980</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Borjali</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Magnéli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Malchau</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Muratoglu</surname>
              <given-names>OK</given-names>
            </name>
            <name name-style="western">
              <surname>Varadarajan</surname>
              <given-names>KM</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing with deep learning for medical adverse event detection from free-text medical narratives: a case study of detecting total hip replacement dislocation</article-title>
          <source>Comput Biol Med</source>
          <year>2021</year>
          <month>02</month>
          <volume>129</volume>
          <fpage>104140</fpage>
          <pub-id pub-id-type="doi">10.1016/j.compbiomed.2020.104140</pub-id>
          <pub-id pub-id-type="medline">33278631</pub-id>
          <pub-id pub-id-type="pii">S0010-4825(20)30471-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rojas</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Carey</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Edelson</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Venable</surname>
              <given-names>LR</given-names>
            </name>
            <name name-style="western">
              <surname>Howell</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Churpek</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>Predicting intensive care unit readmission with machine learning using electronic health record data</article-title>
          <source>Ann Am Thorac Soc</source>
          <year>2018</year>
          <month>07</month>
          <volume>15</volume>
          <issue>7</issue>
          <fpage>846</fpage>
          <lpage>853</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29787309"/>
          </comment>
          <pub-id pub-id-type="doi">10.1513/AnnalsATS.201710-787OC</pub-id>
          <pub-id pub-id-type="medline">29787309</pub-id>
          <pub-id pub-id-type="pmcid">PMC6207111</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Localio</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Laird</surname>
              <given-names>NL</given-names>
            </name>
          </person-group>
          <article-title>Reliability and validity of judgments concerning adverse events suffered by hospitalized patients</article-title>
          <source>Med Care</source>
          <year>1989</year>
          <month>12</month>
          <volume>27</volume>
          <issue>12</issue>
          <fpage>1148</fpage>
          <lpage>1158</lpage>
          <pub-id pub-id-type="doi">10.1097/00005650-198912000-00006</pub-id>
          <pub-id pub-id-type="medline">2593729</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haley</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Schaberg</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>McClish</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Quade</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Crossley</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Culver</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Morgan</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>McGowan</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Shachtman</surname>
              <given-names>RH</given-names>
            </name>
          </person-group>
          <article-title>The accuracy of retrospective chart review in measuring nosocomial infection rates. Results of validation studies in pilot hospitals</article-title>
          <source>Am J Epidemiol</source>
          <year>1980</year>
          <month>05</month>
          <volume>111</volume>
          <issue>5</issue>
          <fpage>516</fpage>
          <lpage>533</lpage>
          <pub-id pub-id-type="doi">10.1093/oxfordjournals.aje.a112931</pub-id>
          <pub-id pub-id-type="medline">7377196</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
