<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR AI</journal-id><journal-id journal-id-type="publisher-id">ai</journal-id><journal-id journal-id-type="index">41</journal-id><journal-title>JMIR AI</journal-title><abbrev-journal-title>JMIR AI</abbrev-journal-title><issn pub-type="epub">2817-1705</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v4i1e63147</article-id><article-id pub-id-type="doi">10.2196/63147</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Natural Language Processing for Identification of Hospitalized People Who Use Drugs: Cohort Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Sato</surname><given-names>Taisuke</given-names></name><degrees>BA</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Grussing</surname><given-names>Emily D</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Patel</surname><given-names>Ruchi</given-names></name><degrees>BDS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ridgway</surname><given-names>Jessica</given-names></name><degrees>MD, MS</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib 
contrib-type="author"><name name-style="western"><surname>Suzuki</surname><given-names>Joji</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sweigart</surname><given-names>Benjamin</given-names></name><degrees>MA</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Miller</surname><given-names>Robert</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Wurcel</surname><given-names>Alysse G</given-names></name><degrees>MD, MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Tufts Medical Center</institution><addr-line>Tupper Building 4F, 800 Washington St</addr-line><addr-line>Boston</addr-line><addr-line>MA</addr-line><country>United States</country></aff><aff id="aff2"><institution>University of Chicago School of Medicine</institution><addr-line>Chicago</addr-line><addr-line>IL</addr-line><country>United States</country></aff><aff id="aff3"><institution>Brigham and Women's Hospital</institution><addr-line>Boston</addr-line><addr-line>MA</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Luo</surname><given-names>Gang</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Morin</surname><given-names>Christophe</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Torgersen</surname><given-names>Jessie</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Huang</surname><given-names>Xiaoshuo</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to 
Alysse G Wurcel, MD, MS, Tufts Medical Center, Tupper Building 4F, 800 Washington St, Boston, MA, United States, 1 617 636 4605; <email>Alysse.Wurcel@bmc.org</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>18</day><month>7</month><year>2025</year></pub-date><volume>4</volume><elocation-id>e63147</elocation-id><history><date date-type="received"><day>11</day><month>06</month><year>2024</year></date><date date-type="rev-recd"><day>17</day><month>03</month><year>2025</year></date><date date-type="accepted"><day>17</day><month>03</month><year>2025</year></date></history><copyright-statement>&#x00A9; Taisuke Sato, Emily D Grussing, Ruchi Patel, Jessica Ridgway, Joji Suzuki, Benjamin Sweigart, Robert Miller, Alysse G Wurcel. Originally published in JMIR AI (<ext-link ext-link-type="uri" xlink:href="https://ai.jmir.org">https://ai.jmir.org</ext-link>), 18.7.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.ai.jmir.org/">https://www.ai.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://ai.jmir.org/2025/1/e63147"/><abstract><sec><title>Background</title><p>People who use drugs (PWUD) are at heightened risk of severe injection&#x2013;related infections. 
Current research relies on billing codes to identify PWUD&#x2014;a methodology with suboptimal accuracy that may underestimate the economic, racial, and ethnic diversity of hospitalized PWUD.</p></sec><sec><title>Objective</title><p>The goal of this study is to examine the impact of natural language processing (NLP) on enhancing identification of PWUD in electronic medical records, with a specific focus on determining improved systems of identifying populations who may previously have been missed, including people who have low income or those from racially and ethnically minoritized populations.</p></sec><sec sec-type="methods"><title>Methods</title><p>Health informatics specialists assisted in querying a cohort of likely PWUD hospital admissions at Tufts Medical Center between 2020&#x2010;2022 using the following criteria: (1) <italic>ICD-10</italic> codes indicative of drug use, (2) positive drug toxicology results, (3) prescriptions for medications for opioid use disorder, and (4) NLP-detected presence of &#x201C;token&#x201D; keywords in the electronic medical records likely indicative of the patient being a PWUD. Hospital admissions were split into two groups: highly documented (all four criteria present) and minimally documented (NLP-only). These groups were examined to assess the impact of race, ethnicity, and social vulnerability index. With chart review as the &#x201C;gold standard,&#x201D; the positive predictive value was calculated.</p></sec><sec sec-type="results"><title>Results</title><p>The cohort included 4548 hospital admissions, with broad heterogeneity in how people entered the cohort and subcohorts; a total of 288 hospital admissions entered the cohort through NLP token presence alone. NLP demonstrated a 54% positive predictive value, outperforming biomarkers, prescription for medications for opioid use disorder, and <italic>ICD</italic> codes in identifying hospitalizations of PWUD. 
Additionally, NLP significantly enhanced these methods when integrated into the identification algorithm. The study also found that people from racially and ethnically minoritized communities and those with lower social vulnerability index were significantly more likely to have lower rates of PWUD-related documentation.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>NLP proved effective in identifying hospitalizations of PWUD, surpassing traditional methods. While further refinement is needed, NLP shows promising potential in minimizing health care disparities.</p></sec></abstract><kwd-group><kwd>SIRI</kwd><kwd>natural language processing</kwd><kwd>NLP</kwd><kwd>people who use drugs</kwd><kwd>substance use disorder</kwd><kwd>HIV</kwd><kwd>hepatitis C</kwd><kwd>HCV</kwd><kwd>substance use</kwd><kwd>readmission</kwd><kwd>mortality</kwd><kwd>assessment</kwd><kwd>cardiovascular disease</kwd><kwd>drug use</kwd><kwd>electronic medical record</kwd><kwd>serious injection-related infections</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>In the absence of harm reduction tools, people who use drugs (PWUD) are at increased risk of disease, hospitalization, and death [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. Gaps in the provision of guideline-concordant care to hospitalized PWUD occur, especially among individuals from racially and ethnically minoritized communities [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. Barriers to optimization of health care for hospitalized PWUD include undertreatment of pain and substance use disorders, which have been linked to discharges before medical optimization and higher rates of readmission and mortality [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. 
Best practices for managing PWUD in a hospitalized setting include addiction care itself as well as treatment and prevention of life-threatening infections [<xref ref-type="bibr" rid="ref10">10</xref>].</p><p>Effective identification of hospitalized PWUD is essential for epidemiological tracking, resource allocation, and evaluating interventions. However, current methodologies often fail to accurately capture this population. The &#x201C;gold standard&#x201D; for identifying PWUD hospitalizations is human-guided chart review, a highly regulated and time-intensive process with potential consequences for breach of confidentiality [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. Administrative billing codes (also known as International Classification of Disease codes, ICD codes) have been used for PWUD identification. Unlike several other common conditions such as cardiovascular diseases for which <italic>ICD-10</italic> codes are highly accurate [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>], a systematic review found that for identification of PWUD, <italic>ICD-9/10</italic> codes had high specificity but limited sensitivity ranging from 47%&#x2010;83% [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Indicators for substance use tend to be noted in the social history section of the electronic medical record (EMR) rather than a formal diagnosis. 
Some researchers have used the hepatitis C virus (HCV) codes as a marker of drug use, although there are a substantial number of people with HCV who do not currently use drugs or have never used drugs [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>].</p><p>The barrier to identifying PWUD can potentially be addressed with natural language processing (NLP), which leverages artificial intelligence (AI) algorithms for interpretation of the written text in a context-relevant manner [<xref ref-type="bibr" rid="ref18">18</xref>]. NLP has been effectively applied to medical examiners&#x2019; reports to increase the accuracy of identifying substance use disorder-related deaths [<xref ref-type="bibr" rid="ref19">19</xref>], identify substance use disorders in outpatients with HIV [<xref ref-type="bibr" rid="ref20">20</xref>], and enhance preventive care for hospitalized patients with HIV [<xref ref-type="bibr" rid="ref17">17</xref>]. In particular, regular expression (RegEx), a rule-based text-matching framework, has been used to identify text patterns [<xref ref-type="bibr" rid="ref21">21</xref>]. RegEx has recently been used as a tool for identification of encounters with people with opioid use disorder (OUD) [<xref ref-type="bibr" rid="ref22">22</xref>]. A few studies have examined the application of NLP to identify hospitalized PWUD admitted for bloodstream infections; however, these efforts were single-center evaluations, focused only on injection drug use [<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. Despite its innovative capacity to identify PWUD, the field of NLP methodology is nascent. 
The goal of this study was to evaluate the impact of NLP on the creation of a cohort of hospitalized PWUD and to evaluate disparities in documentation.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Definition of PWUD</title><p>As &#x201C;drug use&#x201D; is a broad term, it is worth emphasizing that &#x201C;PWUD&#x201D; in this study includes the use of cocaine, methamphetamine, fentanyl, and heroin. We use the term PWUD to describe people in the cohort, rather than &#x201C;people who inject drugs&#x201D;&#x2014;another term used to describe this population&#x2014;because these drugs can be consumed intravenously, smoked, or snorted. We do not use the term substance use disorder (SUD), as some PWUD do not meet diagnostic criteria for SUD and may not identify as having an SUD. Although drug use can also include cannabis and alcohol, we did not include these substances in the definition of drug use.</p></sec><sec id="s2-2"><title>Overview of Cohort Creation</title><p>Tufts Medical Center (TuftsMC) is a tertiary health care center located in Boston, Massachusetts, with a strong history of clinician-researcher partnerships to improve care for PWUD [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. A health informatics specialist (RM) queried hospitalizations likely involving PWUD at TuftsMC between January 1, 2020, and April 1, 2022, guided by specific criteria (see below). 
The unit of measurement was the hospitalization encounter, not the individual patient; each encounter, even if from the same patient, requires separate clinical considerations and presents a distinct opportunity for the implementation of evidence-based practices such as introducing medications for OUD.</p><p>The presence of any of the following criteria (ie, abbreviated with the letters B, D, M, and N) was used to qualify the hospitalizations for inclusion in the PWUD cohort:</p><list list-type="bullet"><list-item><p>B (Biomarkers): In line with a previous study, positive urine toxicology for drugs or medications for SUD (eg, cocaine, amphetamine, methadone, suboxone, fentanyl, opiate, oxycodone), positive HCV antibody with positive or quantifiable HCV viral load [<xref ref-type="bibr" rid="ref29">29</xref>]</p></list-item><list-item><p>D (Diagnostic codes): Presence of <italic>ICD-9</italic> and/or <italic>ICD-10</italic> code for overdose, substance use disorders, substance-related disorders, and Hepatitis C, considering historical diagnoses and those retained in EMRs and inactivated diagnoses that did not migrate with the transition</p></list-item><list-item><p>M (Medications for opioid use disorder): Sublingual buprenorphine (suboxone or subutex) or oral methadone listed as medications in outpatient medication reconciliation, given during hospitalization, or prescribed at discharge. We noted that methadone for OUD is not a medication prescribed at discharge, but is included via discharge reconciliation [<xref ref-type="bibr" rid="ref30">30</xref>].</p></list-item><list-item><p>N (Natural language processing): An iterative list of keywords that are commonly used to describe PWUD in EMR (<xref ref-type="table" rid="table1">Table 1</xref>, <xref ref-type="other" rid="box1">Textbox 1</xref>) was refined by the study team and then provided to the health informatics specialists [<xref ref-type="bibr" rid="ref31">31</xref>]. 
The RegEx patterns were used to identify keywords in the EMRs, accounting for misspellings and variations in context, with incorporation of tokenizing and parsing syntax, context embedding, and approximate string matching. These features enabled context-specific word detection that accounted for minor misspellings or aggregated words. The algorithm was run on the entire EMR, including but not limited to nursing notes, physician notes, discharge summaries, and emergency room records.</p></list-item></list><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>List of <italic>ICD-9/10</italic> Codes for inclusion into PWUD cohort.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Parent code</td><td align="left" valign="bottom">Description</td></tr></thead><tbody><tr><td align="left" valign="top"><italic>F11</italic></td><td align="left" valign="top">Opioid-related disorders</td></tr><tr><td align="left" valign="top"><italic>F14</italic></td><td align="left" valign="top">Cocaine-related disorder</td></tr><tr><td align="left" valign="top"><italic>F15</italic></td><td align="left" valign="top">Other stimulant&#x2013;related disorders</td></tr><tr><td align="left" valign="top"><italic>T400-T406; T436</italic></td><td align="left" valign="top">Poisoning by opium, heroin, other opioids, methadone, synthetic narcotics, cocaine, unspecified narcotics and psychostimulants.</td></tr><tr><td align="left" valign="top"><italic>070.41, 070.44, 070.51, 070.54, 070.70, 070.71</italic></td><td align="left" valign="top">Hepatitis C</td></tr><tr><td align="left" valign="top"><italic>B18.2</italic></td><td align="left" valign="top">Chronic viral hepatitis C</td></tr></tbody></table></table-wrap><boxed-text id="box1"><title>List of words programmed into NLP to detect PWUD encounters.</title><p>IVDU, FENTANYL, Methadone, heroin, suboxone, IVDA, drug abuse, SUD, Substance use disorder, opioid use disorder, opioid 
abuse, OUD, opioid overdose, illicit drugs, addicted, addict, drug addict, injection drug use, intravenous drug use, uses fentanyl, Uses heroin, PWID, abuses drugs, injects heroin, injects drugs, injects fentanyl.</p></boxed-text><p>In addition to the above data, each encounter also had linked demographic data (eg, age, race, ethnicity, gender), length of hospitalization, and social vulnerability index (SVI). The SVI is a tool developed by the Centers for Disease Control and Prevention, used to assess the community&#x2019;s susceptibility to disasters and emergencies; it uses 16 census-based data points to help assess local communities&#x2019; need for aid before and after the disaster [<xref ref-type="bibr" rid="ref32">32</xref>]. It evaluates factors such as socioeconomic status, disability, minority status, and areas that may need additional support during crises. It is a holistic way to represent the social and economic stability of neighborhoods. The SVI was provided as a quartile (eg, 1, 2, 3, 4), with 1 representing the highest level of social vulnerability. Using the Stata software (version; StataCorp), we examined the association between key indicators (ie, race and SVI) and the level of documentation for SUDs.</p></sec><sec id="s2-3"><title>Data Analysis</title><p>Hospitalizations were classified based on the combination of domains (ie, B, D, M, N). A percentage of charts from the D-only and N-only groups was selected for chart review by two research members (EDG, TS). The number of charts reviewed was determined by feasibility and proportion to the entire cohort. Coders reviewed each chart for information that indicated drug use (excluding alcohol and cannabis). 
The process for determining whether a hospitalization event occurred with PWUD included: (1) assessing three types of notes in each chart&#x2014;emergency department admission note, history of present illness, and discharge summary&#x2014;and (2) using the Epic search bar&#x2014;a tool that allows for keyword search within a person&#x2019;s EMR profile&#x2014;for keywords (<xref ref-type="other" rid="box1">Textbox 1</xref>). The coders conducted intercoder reliability testing after completing their first 20 chart reviews, which showed consistency. A logistic regression was performed to examine factors for drug use associated with high documentation, introduced into the cohort by the presence of all of the 4 domains (B, D, M, N) versus low documentation (NLP only).</p></sec><sec id="s2-4"><title>Ethical Considerations</title><p>The study has been approved by the Health Sciences Institutional Review Board of the TuftsMC with waiver of consent granted (approval no. 2450). Identifiable data was only accessed by IRB-approved study staff with appropriate training. Identifiable data was stored on a secure file. As this was a retrospective study, there was no compensation provided to the cohort.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>The Venn diagram illustrates how 4548 hospitalizations involving PWUD entered the cohort based on inclusion criteria (<xref ref-type="fig" rid="figure1">Figure 1</xref>). The study participants&#x2019; characteristics are shown in <xref ref-type="table" rid="table2">Table 2</xref>, along with results of the multivariable logistic regression. People who identified as White or non-Hispanic had higher odds of entering the cohort through NLP alone (adjusted odds ratio [aOR]=2.07; 95% CI 1.54, 2.79). Notably, individuals from the most socioeconomically disadvantaged quartiles (1st and 2nd SVI quartiles) were also significantly more likely to enter the cohort through NLP alone (aOR=1.41; 95% CI 1.06, 1.88). 
The subcohorts with the highest number of hospitalizations were those with ICD codes only (D-group, n=958), biomarkers only (B-group, n=734), and NLP with all four criteria (B, D, N, M group, n=726). Approximately 10% (n=93) individuals in the D-only group and 35% (n=99) in the N-only group underwent chart review. As shown in <xref ref-type="table" rid="table3">Table 3</xref>, the positive predictive value (PPV) of the NLP-only cohort was 54%, outperforming the diagnostic codes-only cohort, which had a PPV of 43%. This demonstrates NLP&#x2019;s ability to enhance identification of PWUD hospitalizations beyond traditional methods.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Venn diagram illustrating the total number of hospitalizations in each cohort. B: biomarkers; D: diagnostic codes; M: medications for opioid use disorder; N: natural language processing.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e63147_fig01.png"/></fig><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Descriptive analysis of PWUD cohort and factors associated with entering the cohort as highly-documented (BDMN<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>) or minimally-documented (NLP<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> only).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variables</td><td align="left" valign="bottom" colspan="3">Criteria for entering cohort</td><td align="left" valign="bottom">Unadjusted OR<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup> (95% CI)</td><td align="left" valign="bottom">Adjusted OR<break/>(95% CI)</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Encounters (N=4548)</td><td align="left" valign="top">Encounters-BDMN (n=726)</td><td align="left" valign="top">Encounters-NLP<sup><xref ref-type="table-fn" 
rid="table2fn2">b</xref></sup> only (n=288)</td><td align="left" valign="top"/><td align="left" valign="top"/></tr></thead><tbody><tr><td align="left" valign="top">Age (years), mean (SD)</td><td align="left" valign="top">47.9 (13.8)</td><td align="left" valign="top">43.3 (10.7)</td><td align="left" valign="top">45.6 (14.5)</td><td align="left" valign="top">&#x2013;<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup></td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top" colspan="6">Sex, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;Male</td><td align="left" valign="top">2837 (62.4)</td><td align="left" valign="top">457 (62.9)</td><td align="left" valign="top">155 (53.8)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;Female</td><td align="left" valign="top">1711 (37.6)</td><td align="left" valign="top">269 (37.1)</td><td align="left" valign="top">133 (46.2)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">Race/Ethnicity, n (%)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Racially/Ethnically minoritized<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup></td><td align="left" valign="top">1583 (34.8)</td><td align="left" valign="top">176 (24.2)</td><td align="left" valign="top">114 (39.6)</td><td align="left" valign="top">1.00 (Ref)</td><td align="left" valign="top">1.00 (Ref)</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;Black</td><td align="left" valign="top">773 (17.0)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" 
valign="top">&#x2003;&#x2003;Hispanic</td><td align="left" valign="top">469 (10.3)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;Asian</td><td align="left" valign="top">122 (2.7)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;Asian Indian</td><td align="left" valign="top">24 (0.5)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;Hawaiian</td><td align="left" valign="top">1 (0.02)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;Other</td><td align="left" valign="top">22 (0.5)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;Unknown</td><td align="left" valign="top">172 (3.8)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;White/non-Hispanic</td><td align="left" valign="top">2965 (65.2)</td><td align="left" valign="top">550 (75.8)</td><td align="left" valign="top">174 (60.4)</td><td align="left" valign="top">2.04 (1.53, 2.73)</td><td align="left" valign="top">2.07 (1.54, 2.79)<sup><xref ref-type="table-fn" 
rid="table2fn5">e</xref></sup></td></tr><tr><td align="left" valign="top">Length of hospitalization, mean (SD)</td><td align="left" valign="top">38.7 (26.3)</td><td align="left" valign="top">41.5 (25.7)</td><td align="left" valign="top">34.7 (26.4)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">Social vulnerability index (quartiles)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;3rd-4th</td><td align="left" valign="top">2462 (54.1)</td><td align="left" valign="top">461 (63.5)</td><td align="left" valign="top">163 (56.6)</td><td align="left" valign="top">1.34 (1.01, 1.77)</td><td align="left" valign="top">1.41 (1.06, 1.88)<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup></td></tr><tr><td align="left" valign="top">&#x2003;1st-2nd</td><td align="left" valign="top">2070 (45.5)</td><td align="left" valign="top">262 (36.1)</td><td align="left" valign="top">124 (43.1)</td><td align="left" valign="top">1.00 (Ref)</td><td align="left" valign="top">1.00 (Ref)</td></tr><tr><td align="left" valign="top">&#x2003;Missing</td><td align="left" valign="top">16 (0.4)</td><td align="left" valign="top">3 (0.4)</td><td align="left" valign="top">1 (0.4)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top" colspan="6">Urine toxicology, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;Opiate</td><td align="left" valign="top">658 (14.5)</td><td align="left" valign="top">136 (18.7)</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;Fentanyl</td><td align="left" valign="top">1313 (24.9)</td><td align="left" valign="top">430 (59.2)</td><td 
align="left" valign="top">0</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;Oxycodone</td><td align="left" valign="top">369 (8.1)</td><td align="left" valign="top">66 (9.1)</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;Methadone</td><td align="left" valign="top">272 (5.9)</td><td align="left" valign="top">224 (30.9)</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;Cocaine</td><td align="left" valign="top">622 (13.7)</td><td align="left" valign="top">258 (35.5)</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;Amphetamine</td><td align="left" valign="top">323 (7.1)</td><td align="left" valign="top">153 (21.1)</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">Primary language, n (%)</td><td align="left" valign="top" colspan="5"/></tr><tr><td align="left" valign="top">&#x2003;English</td><td align="left" valign="top">4296 (94.5)</td><td align="left" valign="top">703 (96.8)</td><td align="left" valign="top">270 (93.8)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr><tr><td align="left" valign="top">&#x2003;Spanish</td><td align="left" valign="top">123 (2.7)</td><td align="left" valign="top">23 (3.2)</td><td align="left" valign="top">11 (3.8)</td><td align="left" valign="top">&#x2013;</td><td align="left" valign="top">&#x2013;</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>BDMN: All criteria for entry into the cohort 
satisfied.</p></fn><fn id="table2fn2"><p><sup>b</sup>NLP: natural language processing.</p></fn><fn id="table2fn3"><p><sup>c</sup>OR: odds ratio.</p></fn><fn id="table2fn4"><p><sup>d</sup>Not applicable.</p></fn><fn id="table2fn5"><p><sup>e</sup>Multivariable model adjusted for age, sex, and social variability index.</p></fn><fn id="table2fn6"><p><sup>f</sup>Multivariable model adjusted for age, sex, and race.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Positive predictive values of the NLP-only<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> and ICD-only<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> cohorts.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Cohort</td><td align="left" valign="bottom">Hospitalizations in the cohort, n</td><td align="left" valign="bottom">Charts reviewed, n</td><td align="left" valign="bottom">Charts confirmed as true PWUD<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup> by chart review, n</td><td align="left" valign="bottom">Positive predictive value (%)</td></tr></thead><tbody><tr><td align="left" valign="top">D (diagnostic codes present)</td><td align="left" valign="top">958</td><td align="left" valign="top">93</td><td align="left" valign="top">40</td><td align="left" valign="top">43</td></tr><tr><td align="left" valign="top">N (NLP present)</td><td align="left" valign="top">288</td><td align="left" valign="top">99</td><td align="left" valign="top">53</td><td align="left" valign="top">54</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>NLP: natural language processing.</p></fn><fn id="table3fn2"><p><sup>b</sup>ICD: International Classification of Diseases codes.</p></fn><fn id="table3fn3"><p><sup>c</sup>PWUD: people who use drugs.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><p>Our 
study augments previous work by integrating NLP with diverse identification methods, including urine toxicology and medication records, while simultaneously addressing observed demographic disparities in documentation [<xref ref-type="bibr" rid="ref23">23</xref>]. NLP has the potential to uncover hospital encounters with PWUD that may have previously been missed. Although NLP had greater PPV than diagnostic codes, its PPV remained low. We found that PWUD from racially and ethnically minoritized communities and those who had low income were more likely to be represented in the minimally documented cohort (ie, entry with NLP-only), rather than the maximally documented cohort.</p><p>Largely a result of stigma and racism, PWUD still do not have universal access to evidence-based treatment. Black PWUD tend to enter treatment with a more severe prognosis compared to their White counterparts, partly due to economic barriers in accessing treatment earlier [<xref ref-type="bibr" rid="ref33">33</xref>]. Black, Latino, and Native American individuals also face additional challenges in accessing treatment for SUD due to geographic barriers, health care access, and potential community characteristics or rapport with clinicians [<xref ref-type="bibr" rid="ref34">34</xref>]. We found that such a lack of rapport may be represented at the level of documentation for SUD; lack of SUD documentation was strongly associated with racially or ethnically minoritized identity (aOR=2.07).</p><p>Identification of PWUD who access medical care is important for several reasons. Best practice guidelines for hospitalized PWUD include management of substance use disorder, pain, and acute infection, testing and management for HIV and HCV, vaccinations for hepatitis or other relevant infections, and prevention of HIV with medications [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. In this study, we applied NLP retrospectively. 
Following previous studies that identified low HIV testing rates, we plan to use NLP to augment PWUD cohort creation in a study examining patterns of HIV testing [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. NLP could indeed become a valuable tool for identifying PWUD before discharge, facilitating intervention during hospitalization if EMRs could use NLP to trigger clinical decision support tools that prompt clinicians to consider SUD treatment, prescribe overdose prevention medications at discharge, order labs to prepare for pre-exposure prophylaxis, or offer vaccine services.</p><p>As we consider this study in the larger context of improving health equity, we believe that the next step would be refining the NLP system by adding more keywords, including and excluding certain conditions and medications, and conducting analyses on false-positive and false-negative cases. This study should be replicated in other medical centers across the United States; its wider application across various hospitals, encapsulating diverse populations and regions, will be instrumental. This study also has multifaceted applications, spanning epidemiological tracking, optimizing hospital resource utilization, and influencing the design of specific interventional studies. This study&#x2019;s findings could serve as a launchpad for integrated care for PWUD with less prejudice and inequity. RegEx is a relatively fundamental AI technology, and as more advanced NLP tools become available, we envision our methodology being expanded alongside these tools. Regardless of the type and complexity of NLP technology, the cohorting and comparative analysis outlined in this paper can be used as a framework to assess the NLP&#x2019;s performance against conventional ways of locating PWUD.</p><p>This study is not without its limitations. The NLP system, despite its effectiveness, occasionally misidentifies certain keywords. 
The constant calibration of the algorithm and frequent addition of keywords are needed to optimize and sustain accuracy. There are potential flaws in our characterization of domains; limitations include false positives from using &#x201C;amphetamine&#x201D; as a keyword, which unintentionally classified patients prescribed amphetamines for attention-deficit/hyperactivity disorder as PWUD. Similarly, methadone prescribed for pain management in conditions such as sickle cell disease was misclassified as OUD treatment. Achieving a balance between NLP&#x2019;s inclusivity and exclusivity presents a significant challenge for this purpose. Future steps should include evaluating the NLP system&#x2019;s sensitivity and specificity and iterating on the model to enhance these metrics. This will involve refining the keyword list for PWUD and enhancing the NLP algorithm to better account for common confounding variables. The field of addiction medicine is innovative and adaptive; to make NLP a meaningful clinical or research tool in this field, the NLP systems need to receive extensive training and constant input of nuanced decision-making that clinicians partake in daily. Thus, a feedback mechanism and fine-tuning to train the NLP model based on clinician feedback would be critical, fully leveraging repetitive learning, which is one of AI&#x2019;s biggest strengths. Furthermore, the single-cohort design of the study may limit generalizability; therefore, future studies with streamlined cross-institutional protocols, allowing simultaneous data collection from diverse locations, would improve external validity. This study had a particular focus on comparing diagnostic codes and NLP as single identifiers of PWUD. While NLP identified PWUD with higher PPV than the diagnostic codes, it must be noted that diagnostic codes still exceeded NLP in the actual number of PWUD cases identified. 
One major purpose of NLP in PWUD identification is to identify cases that are otherwise missed in conventional screenings; thus, the fact that NLP alone identified a comparable number of PWUD to diagnostic codes, with a higher predictive rate, is still remarkable. Future investigation should include a more robust performance comparison between a combination of two or more PWUD clinical identification tools.</p><p>The ethics of improving identification of PWUD requires careful consideration. Medical records indicating drug use may become a source of discrimination and compromise job security, housing, and the ability to care for family. To mitigate these risks, institutions should implement strict policies ensuring that NLP findings are used solely for improving patient care. Members of this research team collaborated with a broad group of experts including people with lived experience of SUD on a study outlining some of the potential pros and cons of improving systems to identify PWUD with the creation of an additional <italic>ICD-10</italic> code for injection drug use [<xref ref-type="bibr" rid="ref37">37</xref>]. Future work should proactively incorporate the perspectives of individuals with lived experience of SUD. Furthermore, broader discussion regarding AI&#x2019;s role in health care is needed for effective, ethical, and productive clinical implementation: &#x201C;Should NLP be a &#x2018;wide net&#x2019; or a &#x2018;precision tool&#x2019; when locating PWUD and connecting them to the care they need?&#x201D;</p><p>Despite these limitations, we believe that this study helps frame the future of systems for measuring health care delivery to PWUD. Hospitalization represents a crucial opportunity when nonjudgmental, trauma-informed, culturally competent care can be offered to PWUD. This presents many potential applications for NLP to be built into systems that track epidemiology and inform quality improvement and implementation science. 
By integrating NLP, we can advance equitable PWUD care.</p></sec></body><back><ack><p>Funding was provided by the Tufts CTSI Small Grants to Advance Translational Science (S-GATS) Program.</p></ack><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">aOR</term><def><p>adjusted odds ratio</p></def></def-item><def-item><term id="abb3">EMR</term><def><p>electronic medical record</p></def></def-item><def-item><term id="abb4">HCV</term><def><p>hepatitis C virus</p></def></def-item><def-item><term id="abb5">ICD</term><def><p>International Classification of Diseases codes</p></def></def-item><def-item><term id="abb6">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb7">OUD</term><def><p>opioid use disorder</p></def></def-item><def-item><term id="abb8">PPV</term><def><p>positive predictive value</p></def></def-item><def-item><term id="abb9">PWUD</term><def><p>people who use drugs</p></def></def-item><def-item><term id="abb10">RegEx</term><def><p>regular expression</p></def></def-item><def-item><term id="abb11">SUD</term><def><p>substance use disorder</p></def></def-item><def-item><term id="abb12">SVI</term><def><p>social variability index</p></def></def-item><def-item><term id="abb13">TuftsMC</term><def><p>Tufts Medical Center</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chiosi</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Mueller</surname><given-names>PP</given-names> </name><name name-style="western"><surname>Chhatwal</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ciaranello</surname><given-names>AL</given-names> 
</name></person-group><article-title>A multimorbidity model for estimating health outcomes from the syndemic of injection drug use and associated infections in the United States</article-title><source>BMC Health Serv Res</source><year>2023</year><month>07</month><day>17</day><volume>23</volume><issue>1</issue><fpage>760</fpage><pub-id pub-id-type="doi">10.1186/s12913-023-09773-1</pub-id><pub-id pub-id-type="medline">37461007</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mattson</surname><given-names>CL</given-names> </name><name name-style="western"><surname>Tanz</surname><given-names>LJ</given-names> </name><name name-style="western"><surname>Quinn</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kariisa</surname><given-names>M</given-names> </name><name name-style="western"><surname>Patel</surname><given-names>P</given-names> </name><name name-style="western"><surname>Davis</surname><given-names>NL</given-names> </name></person-group><article-title>Trends and geographic patterns in drug and synthetic opioid overdose deaths - United States, 2013-2019</article-title><source>MMWR Morb Mortal Wkly Rep</source><year>2021</year><month>02</month><day>12</day><volume>70</volume><issue>6</issue><fpage>202</fpage><lpage>207</lpage><pub-id pub-id-type="doi">10.15585/mmwr.mm7006a4</pub-id><pub-id pub-id-type="medline">33571180</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sun</surname><given-names>J</given-names> </name><name name-style="western"><surname>Mehta</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Astemborski</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Mortality among people who inject drugs: a prospective 
cohort followed over three&#x2009;decades in Baltimore, MD, USA</article-title><source>Addiction</source><year>2022</year><month>03</month><volume>117</volume><issue>3</issue><fpage>646</fpage><lpage>655</lpage><pub-id pub-id-type="doi">10.1111/add.15659</pub-id><pub-id pub-id-type="medline">34338374</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hollander</surname><given-names>MAG</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>CCH</given-names> </name><name name-style="western"><surname>Douaihy</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Hulsey</surname><given-names>E</given-names> </name><name name-style="western"><surname>Donohue</surname><given-names>JM</given-names> </name></person-group><article-title>Racial inequity in medication treatment for opioid use disorder: exploring potential facilitators and barriers to use</article-title><source>Drug Alcohol Depend</source><year>2021</year><month>10</month><day>1</day><volume>227</volume><fpage>108927</fpage><pub-id pub-id-type="doi">10.1016/j.drugalcdep.2021.108927</pub-id><pub-id pub-id-type="medline">34358766</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hamdan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Smyth</surname><given-names>E</given-names> </name><name name-style="western"><surname>Murphy</surname><given-names>ME</given-names> </name><etal/></person-group><article-title>Racial and ethnic disparities in HIV testing in people who use drugs admitted to a tertiary care hospital</article-title><source>AIDS Patient Care STDS</source><year>2022</year><month>11</month><volume>36</volume><issue>11</issue><fpage>425</fpage><lpage>430</lpage><pub-id 
pub-id-type="doi">10.1089/apc.2022.0165</pub-id><pub-id pub-id-type="medline">36301195</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Westgard</surname><given-names>LK</given-names> </name><name name-style="western"><surname>Sato</surname><given-names>T</given-names> </name><name name-style="western"><surname>Bradford</surname><given-names>WS</given-names> </name><etal/></person-group><article-title>National HIV and HCV screening rates for hospitalized people who use drugs are suboptimal and heterogeneous across 11 US hospitals</article-title><source>Open Forum Infect Dis</source><year>2024</year><month>05</month><volume>11</volume><issue>5</issue><fpage>ofae204</fpage><pub-id pub-id-type="doi">10.1093/ofid/ofae204</pub-id><pub-id pub-id-type="medline">38746950</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ti</surname><given-names>Lianping</given-names> </name><name name-style="western"><surname>Ti</surname><given-names>Lianlian</given-names> </name></person-group><article-title>Leaving the hospital against medical advice among people who use illicit drugs: a systematic review</article-title><source>Am J Public Health</source><year>2015</year><month>12</month><volume>105</volume><issue>12</issue><fpage>e53</fpage><lpage>e59</lpage><pub-id pub-id-type="doi">10.2105/AJPH.2015.302885</pub-id><pub-id pub-id-type="medline">26469651</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hazen</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pizzicato</surname><given-names>L</given-names> </name><name name-style="western"><surname>Hom</surname><given-names>J</given-names> 
</name><name name-style="western"><surname>Johnson</surname><given-names>C</given-names> </name><name name-style="western"><surname>Viner</surname><given-names>KM</given-names> </name></person-group><article-title>Association between discharges against medical advice and readmission in patients treated for drug injection-related skin and soft tissue infections</article-title><source>J Subst Abuse Treat</source><year>2021</year><month>07</month><volume>126</volume><fpage>108465</fpage><pub-id pub-id-type="doi">10.1016/j.jsat.2021.108465</pub-id><pub-id pub-id-type="medline">34116815</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Eaton</surname><given-names>EF</given-names> </name><name name-style="western"><surname>Westfall</surname><given-names>AO</given-names> </name><name name-style="western"><surname>McClesky</surname><given-names>B</given-names> </name><etal/></person-group><article-title>In-Hospital illicit drug use and patient-directed discharge: barriers to care for patients with injection-related infections</article-title><source>Open Forum Infect Dis</source><year>2020</year><month>03</month><volume>7</volume><issue>3</issue><fpage>ofaa074</fpage><pub-id pub-id-type="doi">10.1093/ofid/ofaa074</pub-id><pub-id pub-id-type="medline">32258203</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Calcaterra</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Bottner</surname><given-names>R</given-names> </name><name name-style="western"><surname>Martin</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Management of opioid use disorder, opioid withdrawal, and opioid overdose prevention in hospitalized adults: A systematic review of existing 
guidelines</article-title><source>J Hosp Med</source><year>2022</year><month>09</month><volume>17</volume><issue>9</issue><fpage>679</fpage><lpage>692</lpage><pub-id pub-id-type="doi">10.1002/jhm.12908</pub-id><pub-id pub-id-type="medline">35880821</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Straub</surname><given-names>L</given-names> </name><name name-style="western"><surname>Gagne</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Maro</surname><given-names>JC</given-names> </name><etal/></person-group><article-title>Evaluation of use of technologies to facilitate medical chart review</article-title><source>Drug Saf</source><year>2019</year><month>09</month><volume>42</volume><issue>9</issue><fpage>1071</fpage><lpage>1080</lpage><pub-id pub-id-type="doi">10.1007/s40264-019-00838-x</pub-id><pub-id pub-id-type="medline">31111340</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schaper</surname><given-names>E</given-names> </name><name name-style="western"><surname>Padwa</surname><given-names>H</given-names> </name><name name-style="western"><surname>Urada</surname><given-names>D</given-names> </name><name name-style="western"><surname>Shoptaw</surname><given-names>S</given-names> </name></person-group><article-title>Substance use disorder patient privacy and comprehensive care in integrated health care settings</article-title><source>Psychol Serv</source><year>2016</year><month>02</month><volume>13</volume><issue>1</issue><fpage>105</fpage><lpage>109</lpage><pub-id pub-id-type="doi">10.1037/a0037968</pub-id><pub-id pub-id-type="medline">26845493</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Saczynski</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Andrade</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Harrold</surname><given-names>LR</given-names> </name><etal/></person-group><article-title>A systematic review of validated methods for identifying heart failure using administrative data</article-title><source>Pharmacoepidemiol Drug Saf</source><year>2012</year><month>01</month><volume>21 Suppl 1</volume><issue>1</issue><fpage>129</fpage><lpage>140</lpage><pub-id pub-id-type="doi">10.1002/pds.2313</pub-id><pub-id pub-id-type="medline">22262599</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Segar</surname><given-names>MW</given-names> </name><name name-style="western"><surname>Keshvani</surname><given-names>N</given-names> </name><name name-style="western"><surname>Rao</surname><given-names>S</given-names> </name><name name-style="western"><surname>Fonarow</surname><given-names>GC</given-names> </name><name name-style="western"><surname>Das</surname><given-names>SR</given-names> </name><name name-style="western"><surname>Pandey</surname><given-names>A</given-names> </name></person-group><article-title>Race, social determinants of health, and length of stay among hospitalized patients with heart failure: an analysis from the Get With The Guidelines-Heart Failure Registry</article-title><source>Circ: Heart Failure</source><year>2022</year><month>11</month><volume>15</volume><issue>11</issue><pub-id pub-id-type="doi">10.1161/CIRCHEARTFAILURE.121.009401</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Campanile</surname><given-names>Y</given-names> </name><name 
name-style="western"><surname>Silverman</surname><given-names>M</given-names> </name></person-group><article-title>Sensitivity, specificity and predictive values of ICD-10 substance use codes in a cohort of substance use-related endocarditis patients</article-title><source>Am J Drug Alcohol Abuse</source><year>2022</year><month>09</month><day>3</day><volume>48</volume><issue>5</issue><fpage>538</fpage><lpage>547</lpage><pub-id pub-id-type="doi">10.1080/00952990.2022.2047713</pub-id><pub-id pub-id-type="medline">35579599</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ball</surname><given-names>LJ</given-names> </name><name name-style="western"><surname>Sherazi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Laczko</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Validation of an algorithm to identify infective endocarditis in people who inject drugs</article-title><source>Med Care</source><year>2018</year><month>10</month><volume>56</volume><issue>10</issue><fpage>e70</fpage><lpage>e75</lpage><pub-id pub-id-type="doi">10.1097/MLR.0000000000000838</pub-id><pub-id pub-id-type="medline">29200131</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zalesak</surname><given-names>M</given-names> </name><name name-style="western"><surname>Francis</surname><given-names>K</given-names> </name><name name-style="western"><surname>Gedeon</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Current and future disease progression of the chronic HCV population in the United States</article-title><source>PLoS ONE</source><year>2013</year><volume>8</volume><issue>5</issue><fpage>e63959</fpage><pub-id 
pub-id-type="doi">10.1371/journal.pone.0063959</pub-id><pub-id pub-id-type="medline">23704962</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ehrenfeld</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Gottlieb</surname><given-names>KG</given-names> </name><name name-style="western"><surname>Beach</surname><given-names>LB</given-names> </name><name name-style="western"><surname>Monahan</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Fabbri</surname><given-names>D</given-names> </name></person-group><article-title>Development of a natural language processing algorithm to identify and evaluate transgender patients in electronic health record systems</article-title><source>Ethn Dis</source><year>2019</year><volume>29</volume><issue>Suppl 2</issue><fpage>441</fpage><lpage>450</lpage><pub-id pub-id-type="doi">10.18865/ed.29.S2.441</pub-id><pub-id pub-id-type="medline">31308617</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sims</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Snow</surname><given-names>LA</given-names> </name><name name-style="western"><surname>Porucznik</surname><given-names>CA</given-names> </name></person-group><article-title>Surveillance of methadone-related adverse drug events using multiple public health data sources</article-title><source>J Biomed Inform</source><year>2007</year><month>08</month><volume>40</volume><issue>4</issue><fpage>382</fpage><lpage>389</lpage><pub-id pub-id-type="doi">10.1016/j.jbi.2006.10.004</pub-id><pub-id pub-id-type="medline">17185042</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Ridgway</surname><given-names>JP</given-names> </name><name name-style="western"><surname>Uvin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Schmitt</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Natural language processing of clinical notes to identify mental illness and substance use among people living with HIV: retrospective cohort study</article-title><source>JMIR Med Inform</source><year>2021</year><month>03</month><day>10</day><volume>9</volume><issue>3</issue><fpage>e23456</fpage><pub-id pub-id-type="doi">10.2196/23456</pub-id><pub-id pub-id-type="medline">33688848</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bui</surname><given-names>DDA</given-names> </name><name name-style="western"><surname>Zeng-Treitler</surname><given-names>Q</given-names> </name></person-group><article-title>Learning regular expressions for clinical text classification</article-title><source>J Am Med Inform Assoc</source><year>2014</year><volume>21</volume><issue>5</issue><fpage>850</fpage><lpage>857</lpage><pub-id pub-id-type="doi">10.1136/amiajnl-2013-002411</pub-id><pub-id pub-id-type="medline">24578357</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Almudaifer</surname><given-names>AI</given-names> </name><name name-style="western"><surname>Covington</surname><given-names>W</given-names> </name><name name-style="western"><surname>Hairston</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Multi-task transfer learning for the prediction of entity modifiers in clinical text: application to opioid use disorder case detection</article-title><source>J Biomed 
Semantics</source><year>2024</year><month>06</month><day>7</day><volume>15</volume><issue>1</issue><fpage>11</fpage><pub-id pub-id-type="doi">10.1186/s13326-024-00311-4</pub-id><pub-id pub-id-type="medline">38849884</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goodman-Meza</surname><given-names>D</given-names> </name><name name-style="western"><surname>Tang</surname><given-names>A</given-names> </name><name name-style="western"><surname>Aryanfar</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Natural language processing and machine learning to identify people who inject drugs in electronic health records</article-title><source>Open Forum Infect Dis</source><year>2022</year><month>09</month><volume>9</volume><issue>9</issue><fpage>ofac471</fpage><pub-id pub-id-type="doi">10.1093/ofid/ofac471</pub-id><pub-id pub-id-type="medline">36168546</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bartholomew</surname><given-names>TS</given-names> </name><name name-style="western"><surname>Tookes</surname><given-names>HE</given-names> </name><name name-style="western"><surname>Spencer</surname><given-names>EC</given-names> </name><name name-style="western"><surname>Feaster</surname><given-names>DJ</given-names> </name></person-group><article-title>Application of machine learning algorithms for localized syringe services program policy implementation &#x2013; Florida, 2017</article-title><source>Ann Med</source><year>2022</year><month>12</month><day>31</day><volume>54</volume><issue>1</issue><fpage>2137</fpage><lpage>2150</lpage><pub-id pub-id-type="doi">10.1080/07853890.2022.2105391</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation 
citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cresta Morgado</surname><given-names>P</given-names> </name><name name-style="western"><surname>Carusso</surname><given-names>M</given-names> </name><name name-style="western"><surname>Alonso Alemany</surname><given-names>L</given-names> </name><name name-style="western"><surname>Acion</surname><given-names>L</given-names> </name></person-group><article-title>Practical foundations of machine learning for addiction research. Part I. Methods and techniques</article-title><source>Am J Drug Alcohol Abuse</source><year>2022</year><month>05</month><day>4</day><volume>48</volume><issue>3</issue><fpage>260</fpage><lpage>271</lpage><pub-id pub-id-type="doi">10.1080/00952990.2021.1995739</pub-id><pub-id pub-id-type="medline">35389305</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rivero-Ju&#x00E1;rez</surname><given-names>A</given-names> </name><name name-style="western"><surname>Guijo-Rubio</surname><given-names>D</given-names> </name><name name-style="western"><surname>Tellez</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Using machine learning methods to determine a typology of patients with HIV-HCV infection to be treated with antivirals</article-title><source>PLoS ONE</source><year>2020</year><volume>15</volume><issue>1</issue><fpage>e0227188</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0227188</pub-id><pub-id pub-id-type="medline">31923277</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grussing</surname><given-names>ED</given-names> </name><name name-style="western"><surname>Pickard</surname><given-names>B</given-names> </name><name 
name-style="western"><surname>Khalid</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Implementation of a bundle to improve HIV testing during hospitalization for people who inject drugs</article-title><source>Implement Res Pract</source><year>2023</year><volume>4</volume><fpage>26334895231203410</fpage><pub-id pub-id-type="doi">10.1177/26334895231203410</pub-id><pub-id pub-id-type="medline">37936964</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wurcel</surname><given-names>AG</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Burke</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Implementation of a patient-provider agreement to improve healthcare delivery for patients with substance use disorder in the inpatient setting</article-title><source>J Patient Saf</source><year>2021</year><month>12</month><day>1</day><volume>17</volume><issue>8</issue><fpage>e1827</fpage><lpage>e1832</lpage><pub-id pub-id-type="doi">10.1097/PTS.0000000000000721</pub-id><pub-id pub-id-type="medline">32398540</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Reed</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Jordan</surname><given-names>AE</given-names> </name><name name-style="western"><surname>Perlman</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Smith</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Hagan</surname><given-names>H</given-names> </name></person-group><article-title>The HCV care continuum among people who use drugs: protocol for a systematic review and 
meta-analysis</article-title><source>Syst Rev</source><year>2016</year><month>07</month><day>11</day><volume>5</volume><issue>1</issue><fpage>110</fpage><pub-id pub-id-type="doi">10.1186/s13643-016-0293-6</pub-id><pub-id pub-id-type="medline">27401499</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hoffman</surname><given-names>KA</given-names> </name><name name-style="western"><surname>Ponce Terashima</surname><given-names>J</given-names> </name><name name-style="western"><surname>McCarty</surname><given-names>D</given-names> </name></person-group><article-title>Opioid use disorder and treatment: challenges and opportunities</article-title><source>BMC Health Serv Res</source><year>2019</year><month>11</month><day>25</day><volume>19</volume><issue>1</issue><fpage>884</fpage><pub-id pub-id-type="doi">10.1186/s12913-019-4751-4</pub-id><pub-id pub-id-type="medline">31767011</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McGrew</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Homco</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Garwe</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Validity of International Classification of Diseases codes in identifying illicit drug use target conditions using medical record data as a reference standard: a systematic review</article-title><source>Drug Alcohol Depend</source><year>2020</year><month>03</month><day>1</day><volume>208</volume><fpage>107825</fpage><pub-id pub-id-type="doi">10.1016/j.drugalcdep.2019.107825</pub-id><pub-id pub-id-type="medline">31982637</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="web"><article-title>Social 
vulnerability index</article-title><source>ATSDR Place and Health - Geospatial Research, Analysis, and Services Program (GRASP)</source><year>2024</year><access-date>2025-07-09</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.atsdr.cdc.gov/place-health/php/svi/index.html">https://www.atsdr.cdc.gov/place-health/php/svi/index.html</ext-link></comment></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Matsuzaka</surname><given-names>S</given-names> </name><name name-style="western"><surname>Knapp</surname><given-names>M</given-names> </name></person-group><article-title>Anti-racism and substance use treatment: addiction does not discriminate, but do we?</article-title><source>J Ethn Subst Abuse</source><year>2020</year><volume>19</volume><issue>4</issue><fpage>567</fpage><lpage>593</lpage><pub-id pub-id-type="doi">10.1080/15332640.2018.1548323</pub-id><pub-id pub-id-type="medline">30642230</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Acevedo</surname><given-names>A</given-names> </name><name name-style="western"><surname>Panas</surname><given-names>L</given-names> </name><name name-style="western"><surname>Garnick</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Disparities in the treatment of substance use disorders: does where you live matter?</article-title><source>J Behav Health Serv Res</source><year>2018</year><month>10</month><volume>45</volume><issue>4</issue><fpage>533</fpage><lpage>549</lpage><pub-id pub-id-type="doi">10.1007/s11414-018-9586-y</pub-id><pub-id pub-id-type="medline">29435862</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Thakarar</surname><given-names>K</given-names> </name><name name-style="western"><surname>Weinstein</surname><given-names>ZM</given-names> </name><name name-style="western"><surname>Walley</surname><given-names>AY</given-names> </name></person-group><article-title>Optimising health and safety of people who inject drugs during transition from acute to outpatient care: narrative review with clinical checklist</article-title><source>Postgrad Med J</source><year>2016</year><month>06</month><volume>92</volume><issue>1088</issue><fpage>356</fpage><lpage>363</lpage><pub-id pub-id-type="doi">10.1136/postgradmedj-2015-133720</pub-id><pub-id pub-id-type="medline">27004476</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zubiago</surname><given-names>J</given-names> </name><name name-style="western"><surname>Murphy</surname><given-names>M</given-names> </name><name name-style="western"><surname>Guardado</surname><given-names>R</given-names> </name><name name-style="western"><surname>Daudelin</surname><given-names>D</given-names> </name><name name-style="western"><surname>Patil</surname><given-names>D</given-names> </name><name name-style="western"><surname>Wurcel</surname><given-names>A</given-names> </name></person-group><article-title>Increased HIV testing in people who use drugs hospitalized in the first wave of the COVID-19 pandemic</article-title><source>J Subst Abuse Treat</source><year>2021</year><month>05</month><volume>124</volume><fpage>108266</fpage><pub-id pub-id-type="doi">10.1016/j.jsat.2020.108266</pub-id><pub-id pub-id-type="medline">33771274</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sundaram</surname><given-names>G</given-names> </name><name 
name-style="western"><surname>Sato</surname><given-names>T</given-names> </name><name name-style="western"><surname>Goodman-Meza</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Perspectives on benefits and risks of creation of an &#x201C;injection drug use&#x201D; billing code</article-title><source>J Subst Use Addict Treat</source><year>2024</year><month>09</month><volume>164</volume><fpage>209392</fpage><pub-id pub-id-type="doi">10.1016/j.josat.2024.209392</pub-id><pub-id pub-id-type="medline">38735482</pub-id></nlm-citation></ref></ref-list></back></article>