<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="review-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR AI</journal-id><journal-id journal-id-type="publisher-id">ai</journal-id><journal-id journal-id-type="index">41</journal-id><journal-title>JMIR AI</journal-title><abbrev-journal-title>JMIR AI</abbrev-journal-title><issn pub-type="epub">2817-1705</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v5i1e77732</article-id><article-id pub-id-type="doi">10.2196/77732</article-id><article-categories><subj-group subj-group-type="heading"><subject>Review</subject></subj-group></article-categories><title-group><article-title>Application of Language Models for the Analysis of Adverse Drug Events in Pharmaceutical Research and Development: Scoping Review</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Schreier</surname><given-names>Oren</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Yazdani</surname><given-names>Anthony</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Galdadas</surname><given-names>Ioannis</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kabak</surname><given-names>Ryme</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gervasio</surname><given-names>Francesco Luigi</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mu</surname><given-names>Gang</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Teodoro</surname><given-names>Douglas</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Radiology and Medical Informatics, Faculty of Medicine, University of Geneva</institution><addr-line>Chemin des Mines 9</addr-line><addr-line>Geneva</addr-line><country>Switzerland</country></aff><aff id="aff2"><institution>School of Pharmaceutical Sciences, University of Geneva</institution><addr-line>Geneva</addr-line><country>Switzerland</country></aff><aff id="aff3"><institution>Institute of Pharmaceutical Sciences of Western Switzerland (ISPSO), University of Geneva</institution><addr-line>Geneva</addr-line><country>Switzerland</country></aff><aff id="aff4"><institution>Swiss Institute of Bioinformatics, University of Geneva</institution><addr-line>Geneva</addr-line><country>Switzerland</country></aff><aff id="aff5"><institution>Johnson &#x0026; Johnson World Headquarters</institution><addr-line>Bridgewater</addr-line><addr-line>NJ</addr-line><country>United States</country></aff><aff id="aff6"><institution>Department of Chemistry, University College London</institution><addr-line>London</addr-line><addr-line>England</addr-line><country>United Kingdom</country></aff><aff id="aff7"><institution>Cilag GmbH International</institution><addr-line>Zug</addr-line><country>Switzerland</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Raisaro</surname><given-names>Jean-Louis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Shah</surname><given-names>Syed Ahtisham Mehmood</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Sakar</surname><given-names>Urmimala</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Douglas Teodoro, PhD, Department of Radiology and Medical Informatics, Faculty of Medicine, University of Geneva, Chemin des Mines 9, Geneva, 1202, Switzerland, 41 0223790225; <email>Douglas.Teodoro@unige.ch</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>16</day><month>6</month><year>2026</year></pub-date><volume>5</volume><elocation-id>e77732</elocation-id><history><date date-type="received"><day>23</day><month>05</month><year>2025</year></date><date date-type="rev-recd"><day>30</day><month>01</month><year>2026</year></date><date date-type="accepted"><day>07</day><month>03</month><year>2026</year></date></history><copyright-statement>&#x00A9; Oren Schreier, Anthony Yazdani, Ioannis Galdadas, Ryme Kabak, Francesco Luigi Gervasio, Gang Mu, Douglas Teodoro. Originally published in JMIR AI (<ext-link ext-link-type="uri" xlink:href="https://ai.jmir.org">https://ai.jmir.org</ext-link>), 16.6.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.ai.jmir.org/">https://www.ai.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://ai.jmir.org/2026/1/e77732"/><abstract><sec><title>Background</title><p>Adverse drug events (ADEs) remain a critical safety issue in pharmaceutical research and development (Pharma R&#x0026;D), necessitating robust methods for early detection and surveillance. Language models (LMs) are increasingly used in ADE analysis, addressing safety challenges during drug development and postmarket surveillance. Language modeling approaches, ranging from static embeddings to large language models (LLMs), capitalize on diverse data sources, such as clinical trial datasets, electronic health records, and social media posts, to predict ADEs, analyze real-world evidence, and improve drug screening and pharmacovigilance systems.</p></sec><sec><title>Objective</title><p>This scoping review aims to map the application of LMs for the analysis of ADEs across the Pharma R&#x0026;D lifecycle.</p></sec><sec sec-type="methods"><title>Methods</title><p>Following the PRISMA-ScR (Preferred Reporting Items for Systematic Reviews and Meta-Analyses Extension for Scoping Reviews) guidelines, we searched PubMed, Web of Science, and Google Scholar for relevant papers published between January 2015 and October 2025.</p></sec><sec sec-type="results"><title>Results</title><p>This review identified 49 relevant papers. Overall, LM applications in Pharma R&#x0026;D safety analysis are concentrated in 2 distinct phases: ADE prediction during the premarket phase (n=16) and ADE detection in postmarket surveillance (n=33).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>While some models demonstrate high predictive performance, persistent challenges, including data heterogeneity and limited external validation, hinder widespread adoption. Despite these barriers, discriminative and generative LMs have the potential to transform drug safety across the pre- and postapproval phases, especially when integrated with real-world pharmacovigilance frameworks.</p></sec></abstract><kwd-group><kwd>adverse drug events</kwd><kwd>artificial intelligence</kwd><kwd>language models</kwd><kwd>drug development</kwd><kwd>pharmacovigilance</kwd><kwd>pharmaceutical research</kwd><kwd>risk assessment</kwd><kwd>information extraction</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Adverse drug events (ADEs), injuries caused by the use or misuse of medications, pose a major challenge throughout the entire drug development lifecycle [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. It is estimated that over 30% of drug candidates are discarded owing to toxicity, even after they are launched on the market [<xref ref-type="bibr" rid="ref4">4</xref>]. High rates of ADEs have significant consequences for patient safety and health care systems. For example, in the postmarket setting, the prevalence of adverse drug reactions among hospitalized older adults is 22%; yet, 60% are preventable cases largely driven by predictable factors such as polypharmacy and complex comorbidities [<xref ref-type="bibr" rid="ref5">5</xref>]. Catastrophic drug safety failures like the thalidomide disaster of 1961, which caused severe birth defects in thousands of infants, underscored the need for rigorous pharmacovigilance. These concerns highlight the importance of early detection and prediction of ADEs across the entire drug development lifecycle, from preclinical testing to phase IV clinical trials.</p><p>The identification of new ADEs caused by a drug product is one of the key activities in the pharmaceutical industry to ensure the safety profile of a drug product. However, assessing the safety of a drug well before it reaches the market is not always straightforward. Drug candidates that appear safe in preclinical stages can exhibit toxicity in clinical phases, leading to high failure rates. One contributing factor to this attrition is the discrepancy between animal models used in preclinical screenings and human biology, where preclinical safety data fail to predict human reactions [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. Consequently, ADEs, including treatment-related fatalities, can emerge even during controlled clinical trials [<xref ref-type="bibr" rid="ref9">9</xref>]. Since premarket testing cannot always guarantee safety, rigorous phase IV surveillance remains essential to identify risks once the drug enters the broader population. Postmarket monitoring relies heavily on spontaneous reporting systems. However, these systems are known to substantially undercount true ADEs [<xref ref-type="bibr" rid="ref10">10</xref>], notably due to limited clinician time and the complexity of reporting workflows [<xref ref-type="bibr" rid="ref11">11</xref>].</p><p>In the modern era, the volume and variety of drug safety data have grown significantly, encompassing not only structured sources, such as trial registries and spontaneous reporting systems, but also diverse real-world data streams, including electronic health records (EHRs) and social media data [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. This abundance of data has outpaced traditional surveillance approaches and created a need for automated methods to monitor drug safety signals. Machine learning (ML) has the potential to assist with signal detection and supplement traditional pharmacovigilance surveillance methods [<xref ref-type="bibr" rid="ref14">14</xref>] due to its capacity for multimodal and large-scale data processing. Among the different ML approaches, language models (LMs) have emerged as a versatile technology for addressing such safety challenges, mostly given their ability to process extremely diverse data, where safety risks can be found in unstructured human language text, such as physician notes, biomedical literature, and social media posts, or encoded in chemical language, where molecular structures are represented as text sequences. Consequently, the field of LMs for drug safety has witnessed a methodological evolution over the last decade. While earlier approaches relied on static representations, recent years have seen a shift toward contextualized architectures and generative Large Language Models (LLMs) [<xref ref-type="bibr" rid="ref15">15</xref>]. These advancements have enabled diverse analyses, ranging from extracting ADE mentions in patient forums to predicting complex toxicity endpoints based solely on molecular formulations.</p><p>Several reviews concerning the use of artificial intelligence (AI) to analyze ADEs are already available, although these sources either miss current developments in LMs or only focus on a specific aspect. In particular, the application of AI to ADE prediction has already been the subject of 3 scoping and 2 systematic reviews between 2022 and 2025 (<xref ref-type="table" rid="table1">Table 1</xref>). Syrowatka et al [<xref ref-type="bibr" rid="ref16">16</xref>], in their scoping review, discuss a series of use cases to identify the most promising areas in which AI can be used to reduce the frequency of ADEs, but exclude studies that included postmarket surveillance. Yang and Kar [<xref ref-type="bibr" rid="ref17">17</xref>] cover a much broader area of the different aspects that contribute to the resulting ADEs, with a strong focus on toxicity prediction, and discuss how AI and ML techniques can be applied in this area. The work of Denck et al [<xref ref-type="bibr" rid="ref18">18</xref>] highlights the ability of AI or ML to analyze large datasets and identify complex patterns in observational health data, thereby improving drug safety and pharmacovigilance. It also discusses limitations, such as the need for high-quality data and the challenges of model interpretability and generalizability. Although the scoping review by Hu et al [<xref ref-type="bibr" rid="ref19">19</xref>] focuses on AI methods that use EHR to predict ADEs, the use of only 10 studies limits the generalizability of their observations. Finally, Teodoro et al [<xref ref-type="bibr" rid="ref20">20</xref>] review diverse AI algorithms for safety, efficacy, and operational risks in clinical trials, noting the recent emergence of LLMs. However, their broad focus on general ML and multiple risk categories limits their specific analysis of LMs applied to safety in the pharmaceutical research and development (Pharma R&#x0026;D) lifecycle.</p><p>Distinct from existing reviews, our scoping review focuses on the application of LMs across the entire Pharma R&#x0026;D pipeline, from preclinical discovery to postmarket surveillance. Our goal is to present a comprehensive layout of how LMs serve as a unifying technology, bridging the methodological gap between premarket toxicity prediction and postmarket surveillance. By covering the time frame from 2015 to October 2025, we capture the technological shift from static embeddings (eg, word2vec) to the emergence of LLMs. Through this analysis, we aim to map recent methodological developments and key trends, but also highlight future research directions based on the outstanding challenges of current approaches. To this end, we address the following research questions:</p><list list-type="bullet"><list-item><p>RQ1: For which organs and toxicity endpoints are LMs used for in safety analysis?</p></list-item><list-item><p>RQ2: What types of LMs have been used to analyze safety risks in drug design and development?</p></list-item><list-item><p>RQ3: What are the data sources and metrics used for training and evaluating LM methods for safety assessment in Pharma R&#x0026;D?</p></list-item><list-item><p>RQ4: What are the current limitations of LM approaches for AI-based ADE analysis?</p></list-item></list><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Overview of existing literature.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Authors</td><td align="left" valign="bottom">Journal</td><td align="left" valign="bottom">Year</td><td align="left" valign="bottom">Scope</td></tr></thead><tbody><tr><td align="left" valign="top">Syrowatka et al [<xref ref-type="bibr" rid="ref16">16</xref>]</td><td align="left" valign="top"><italic>The Lancet Digital Health</italic></td><td align="left" valign="top">2022</td><td align="left" valign="top">ScR<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>: ML<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> and AI<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup> techniques for pharmacovigilance with a focus on detecting ADEs<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">Yang and Kar [<xref ref-type="bibr" rid="ref17">17</xref>]</td><td align="left" valign="top"><italic>Artificial Intelligence Chemistry</italic></td><td align="left" valign="top">2023</td><td align="left" valign="top">SR<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup>: AI and ML methods and databases for early detection of ADEs and toxicity</td></tr><tr><td align="left" valign="top">Denck et al [<xref ref-type="bibr" rid="ref18">18</xref>]</td><td align="left" valign="top"><italic>Drug Discovery Today</italic></td><td align="left" valign="top">2023</td><td align="left" valign="top">SR: ML approaches for the prediction of ADEs from observational health data</td></tr><tr><td align="left" valign="top">Hu et al [<xref ref-type="bibr" rid="ref19">19</xref>]</td><td align="left" valign="top"><italic>Frontiers in Pharmacology</italic></td><td align="left" valign="top">2024</td><td align="left" valign="top">ScR: application of ML algorithms in predicting specific ADEs using EHR<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup> data</td></tr><tr><td align="left" valign="top">Teodoro et al [<xref ref-type="bibr" rid="ref20">20</xref>]</td><td align="left" valign="top"><italic>npj Digital Medicine</italic></td><td align="left" valign="top">2025</td><td align="left" valign="top">ScR: a scoping review of AI applications in clinical trial risk assessment</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>ScR<italic>:</italic> scoping review.</p></fn><fn id="table1fn2"><p><sup>b</sup>ML: machine learning.</p></fn><fn id="table1fn3"><p><sup>c</sup>AI: artificial intelligence.</p></fn><fn id="table1fn4"><p><sup>d</sup>ADE: adverse drug event.</p></fn><fn id="table1fn5"><p><sup>e</sup>SR: systematic review.</p></fn><fn id="table1fn6"><p><sup>f</sup>EHR: electronic health record.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2" sec-type="methods"><title>Methods</title><p>Our systematic search covers peer-reviewed studies published in English between January 1, 2015, and October 15, 2025. Our selection process followed the PRISMA-ScR (Preferred Reporting Items for Systematic Reviews and Meta-Analyses Extension for Scoping Reviews) guidelines (<xref ref-type="supplementary-material" rid="app1">Checklist 1</xref>).</p><sec id="s2-1"><title>Search Strategy and Study Selection</title><p>In the search phase, we used 3 major databases: PubMed, Web of Science, and Google Scholar. We queried databases for potentially relevant records using a broad range of keywords stratified into five groups: (1) Pharma R&#x0026;D, (2) drug-related terms, (3) ADE-related terms, (4) the type of algorithm that was used, and (5) the task that the algorithm was supposed to perform. We combined the keywords within each group using the OR operator, and all groups were combined using the AND operator. To search for papers, we applied the default settings of the respective databases using the title and abstract fields. <xref ref-type="table" rid="table2">Table 2</xref> contains the search keywords used in the process.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Keyword groups for the search strategy<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Group</td><td align="left" valign="bottom">Category</td><td align="left" valign="bottom">Keywords</td></tr></thead><tbody><tr><td align="left" valign="top">1</td><td align="left" valign="top">Pharma R&#x0026;D<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup>-related keywords</td><td align="left" valign="top">&#x201C;clinical research&#x201D; OR &#x201C;clinical trials&#x201D; OR &#x201C;pharmaceutical research&#x201D; OR &#x201C;pharmacological research&#x201D; OR &#x201C;pharmaceutical development&#x201D; OR &#x201C;drug design&#x201D; OR &#x201C;drug development&#x201D; OR &#x201C;pharmacovigilance&#x201D; OR &#x201C;event detection&#x201D;</td></tr><tr><td align="left" valign="top">2</td><td align="left" valign="top">Drug-related keywords</td><td align="left" valign="top">&#x201C;drug&#x201D; OR &#x201C;compound&#x201D; OR &#x201C;substance&#x201D;</td></tr><tr><td align="left" valign="top">3</td><td align="left" valign="top">Adverse drug event&#x2013;related keywords</td><td align="left" valign="top">&#x201C;adverse drug reaction&#x201D; OR &#x201C;adverse drug event&#x201D; OR &#x201C;toxicity&#x201D;</td></tr><tr><td align="left" valign="top">4</td><td align="left" valign="top">Machine learning keywords</td><td align="left" valign="top">&#x201C;artificial intelligence&#x201D; OR &#x201C;language model&#x201D; OR &#x201C;fuzzy&#x201D; OR &#x201C;rule-based&#x201D; OR &#x201C;machine learning&#x201D; OR &#x201C;support vector machine&#x201D; OR &#x201C;decision tree&#x201D; OR &#x201C;neural network&#x201D; OR &#x201C;deep learning&#x201D; OR &#x201C;text mining&#x201D; OR &#x201C;natural language processing&#x201D;</td></tr><tr><td align="left" valign="top">5</td><td align="left" valign="top">Task-related keywords</td><td align="left" valign="top">&#x201C;predict&#x201D; OR &#x201C;extract&#x201D; OR &#x201C;detect&#x201D; OR &#x201C;classify&#x201D;</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>The final query included all the described groups.</p></fn><fn id="table2fn2"><p><sup>b</sup>Pharma R&#x0026;D: pharmaceutical research and development.</p></fn></table-wrap-foot></table-wrap><p>To ensure relevance, we applied specific inclusion and exclusion criteria, as reported in <xref ref-type="other" rid="box1">Textbox 1</xref>, namely papers written in English, with ADEs as the main topic, involving mammalian species, and published in peer-reviewed journals or conference proceedings between January 1, 2015, and October 15, 2025. To focus on the recent trend in the AI field, we excluded papers that did not use LMs in their modeling approach.</p><boxed-text id="box1"><title> Criteria for including and excluding studies.</title><p><bold>Inclusion criteria</bold></p><list list-type="bullet"><list-item><p>Adverse drug events are the main topic of the paper</p></list-item><list-item><p>Basic research</p></list-item><list-item><p>Peer-reviewed papers published in journals and conferences</p></list-item><list-item><p>English language</p></list-item><list-item><p>Publication date between January 1, 2015, and October 15, 2025</p></list-item><list-item><p>All papers retrieved in PubMed and Web of Science, and the top 188 papers in Google Scholar</p></list-item></list><p><bold>Exclusion criteria</bold></p><list list-type="bullet"><list-item><p>Risk factor analyses</p></list-item><list-item><p>Nonlanguage modeling algorithms</p></list-item><list-item><p>Nonpharmacological treatment</p></list-item><list-item><p>Adverse drug events in nonmammalian species</p></list-item><list-item><p>Clinical application (as opposed to pharmaceutical research and development)</p></list-item><list-item><p>Cross-drug interaction (polypharmacy)</p></list-item></list></boxed-text></sec><sec id="s2-2"><title>Dataset Screening and Annotation</title><p>Three researchers (OS, AY, and DT) independently screened the titles and abstracts. The resulting set was cross-checked by IG and RK. Then, OS, AY, IG, RK, and DT read the full texts independently and extracted item information using a standard spreadsheet created before the analysis in line with the research questions. Any differences in including or excluding full-text studies were resolved during a consensus meeting. The final dataset was based on the CHARMS (Critical Appraisal and Data Extraction for Systematic Reviews of Prediction Modeling Studies) checklist and includes the publication date, whether the study was published in a journal or a conference, country of the corresponding author, source of data used, task formulation, toxicity endpoints that were predicted, affected organ, metrics of performance evaluation, the algorithm used, the nature of the algorithm used, the type of LM, the features that were used for the modeling, and the drug design and development stage.</p></sec><sec id="s2-3"><title>Data Analysis</title><p>We analyzed the data using Microsoft Excel for Mac (Microsoft Office 365, version 16.69). We used descriptive statistics like frequencies and ranges and presented the data graphically and in tabular format, as needed.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>The search query resulted in 1397 records from PubMed (n=695), Web of Science (n=514), and Google Scholar (n=188), which, after removing duplicates (n=503), and performing a &#x201C;title &#x0026; abstract&#x201D; screening (n=894; n=836 records excluded), and a full-text eligibility assessment (n=58; n=9 records excluded), were narrowed down to 49 records included for analysis. Our study selection flowchart is shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>PRISMA flowchart describing the different literature sources used, and the selection process followed to filter down the relevant sources that were used in the end (adapted from Page et al [<xref ref-type="bibr" rid="ref21">21</xref>], which is published under Creative Commons Attribution 4.0 International License [<xref ref-type="bibr" rid="ref22">22</xref>]). Only studies whose methodology involved LMs were included. DDI: drug-drug interaction; LM: language model; PRISMA: Preferred Reporting Items for Systematic Reviews and Meta-Analyses.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v5i1e77732_fig01.png"/></fig><p>This review covers studies published both in scientific journals (n=42) and conferences (n=7). Based on the corresponding author&#x2019;s affiliation, 11 of 49 papers are located in China, equaling the number in the United States (n=11), 5 in India, and 4 in Korea, followed by 12 other countries. The increased number of studies on this field over the past 10 years (<xref ref-type="fig" rid="figure2">Figure 2A</xref>) and the large geographical spread of the included studies highlight the growing global interest in developing AI algorithms based on LMs for Pharma R&#x0026;D safety risk assessment, as well as the potential for international collaborations in this regard. As we can note from <xref ref-type="fig" rid="figure2">Figure 2B</xref>, studies cover a large variety of tasks, including ADE-related information extraction from free text, such as named entity recognition (NER) (n=23) [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref31">31</xref>], safety prediction based on molecular structure, such as toxicity prediction (n=13) [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref35">35</xref>], and disproportionality analysis for signal detection (n=6) [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref39">39</xref>].</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>High-level overview of the studies included in the analyses. Trend of artificial intelligence algorithms developed to be used in a premarket or postmarket phase and categorized by (A) application of the algorithm over time, distinguishing premarket applications (red) and postmarket applications (blue) and (B) distribution of studies by task-level application, separating premarket (red) and postmarket (blue) use cases. ADE: adverse drug event; NER: named entity recognition.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v5i1e77732_fig02.png"/></fig><p>As shown in <xref ref-type="fig" rid="figure3">Figure 3</xref>, we can categorize AI applications for safety risk assessment in drug design and development into 2 main groups: safety prediction and ADE detection. These different applications are found across four of the five stages of drug design and development [<xref ref-type="bibr" rid="ref40">40</xref>]: (1) discovery and development, (2) preclinical research, (3) clinical research, (4) regulatory review, and (5) postmarket safety monitoring. Due to the challenge of specifying the exact stage that the study addresses, for simplicity, we grouped these 5 stages into 2: pharmaceutical research (premarket) and postmarket safety monitoring (postmarket). Premarket encompasses from stage 1 (discovery and development) to stage 3 (clinical research), including clinical trials from phase I to phase III, while the postmarket stage (safety monitoring&#x2014;stage 5) includes applications related to clinical trials in phase IV and pharmacovigilance. Regulatory review (stage 4) acts as a bridge between the premarket and the postmarket phases and is not covered in this review.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Artificial intelligence applications for safety risk assessment in drug design and development fall into 2 main categories: safety prediction and ADE detection. The artificial intelligence&#x2013;based analysis process involves three steps: (1) representation: input data, such as chemical compounds and free-text descriptions, are encoded as vectors, heavily supported by learning models. (2) Learning: models are developed to infer safety risks from these data. (3) Prediction: various safety risks are predicted or detected, followed by an evaluation of performance metrics. ADE: adverse drug event; EHR: electronic health record; EL: entity linking; ER: entity relation; NER: named entity recognition.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v5i1e77732_fig03.png"/></fig></sec><sec id="s3-2"><title>Safety Prediction</title><p>The safety prediction category (top image of <xref ref-type="fig" rid="figure3">Figure 3</xref>) encompasses LM-based applications that can predict safety risks before synthesis and preclinical or clinical testing, given a drug or compound formulation. These applications can be used during the discovery and development stage to support screening and during the preclinical and clinical research stages to support safety risk assessment. Prediction studies can be further subdivided into 3 predictive application use cases: toxicity [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref48">48</xref>], ADEs [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>], and severity [<xref ref-type="bibr" rid="ref51">51</xref>]. Toxicity prediction methods are often binary classifiers that predict whether a drug or compound will be toxic for an organ, such as drug-induced liver injury prediction [<xref ref-type="bibr" rid="ref52">52</xref>-<xref ref-type="bibr" rid="ref55">55</xref>], or regressors that predict toxicity properties, such as skin sensitization scores [<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref57">57</xref>]. In ADE prediction, AI methods supported by LMs are designed to predict the occurrence of ADEs, that is, injuries resulting from the use of a drug. These methods are usually multiclass, multilabel classifiers that infer the occurrence of adverse event categories, such as those proposed by the Medical Dictionary for Regulatory Activities (MedDRA) terminology. Conversely, methods for ADE severity prediction are usually binary classifiers that aim to infer the severity of ADEs, such as serious versus nonserious or death versus nondeath events. In terms of phase, these studies (n=16) are concentrated in the premarket pharmaceutical research stage, with the notable exception of the study by Mazuz et al [<xref ref-type="bibr" rid="ref51">51</xref>], which focuses on predicting drug withdrawal based on safety concerns.</p></sec><sec id="s3-3"><title>ADE Detection</title><p>The ADE detection category (bottom image of <xref ref-type="fig" rid="figure3">Figure 3</xref>) encompasses LM applications that extract ADE-related information from individual documents in a given corpus so that signal detection can be performed. These detection studies can be further subdivided into 2 categories: information extraction, including NER [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref65">65</xref>], relation extraction (RE) [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref69">69</xref>], entity linking (EL) [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref62">62</xref>], and document classification, including ADE mentioning in documents [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref70">70</xref>-<xref ref-type="bibr" rid="ref74">74</xref>] and their seriousness [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref75">75</xref>]. NER methods are used to identify ADE-related entities, such as drugs, dosage, route of administration, and ADE names, in relevant pharmacovigilance corpora, such as patient forums [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>-<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref76">76</xref>] and social media [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref59">59</xref>-<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]. RE methods are often combined with NER methods to identify relationships between ADE-related entities. For example, they can establish whether a drug is associated with an ADE [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref67">67</xref>], while EL methods are used to normalize ADE entities against standard terminologies in the field, such as MedDRA [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref62">62</xref>]. These tasks ultimately enable the structuring of ADE-related information found in free-text corpora, allowing for further computation of ADE cases for a given drug and the application of signal detection algorithms. Document classification is a simpler task, in which text passages, such as tweets [<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref74">74</xref>], posts in patient forums [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref76">76</xref>], or incident reports [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref75">75</xref>], are classified as containing ADE information or the seriousness of the reported ADE [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref75">75</xref>]. Unlike the information extraction category, the goal here is to triage large corpora to reduce the cost of manual processing or enable further automated information extraction. Stage-wise, these studies (n=33) are concentrated in the postmarket safety monitoring stage (<xref ref-type="table" rid="table3">Table 3</xref>).</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Overview of included studies by application category across the drug development lifecycle.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Application</td><td align="left" valign="bottom">Studies</td></tr></thead><tbody><tr><td align="left" valign="top">Safety prediction</td><td align="left" valign="top">[<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref77">77</xref>]</td></tr><tr><td align="left" valign="top">ADE<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> detection</td><td align="left" valign="top">[<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref76">76</xref>]</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>ADE: adverse drug event.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>For Which Organs and Toxicity Endpoints Are LMs Used for in Safety Analysis?</title><p>ADEs can manifest in various organs; yet, most reviewed studies addressed ADE prediction in a general context rather than focusing on specific organ toxicities. This is mainly the case of AI models for ADE detection in the postmarket safety monitoring stage. These models often leverage terminologies such as the MedDRA [<xref ref-type="bibr" rid="ref78">78</xref>] or the World Health Organization Anatomical Therapeutic Chemical classification system [<xref ref-type="bibr" rid="ref79">79</xref>] to infer the occurrence of adverse event categories across broad organ systems [<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref81">81</xref>]. When it comes to the pharmaceutical research (premarket) stage, we see a shift toward predicting organ-specific toxicities with binary classifiers, which assess whether a compound will be toxic to particular organs [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref82">82</xref>-<xref ref-type="bibr" rid="ref86">86</xref>].</p><p>The heart (n=6) [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref48">48</xref>] and liver (n=4) [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref46">46</xref>] emerge as the most studied organs for organ-specific ADE prediction (<xref ref-type="table" rid="table4">Table 4</xref>), likely due to their roles in drug metabolism and systemic effects, respectively. Our screening shows that predicting ADEs in other organs, such as the brain or pancreas, poses a greater challenge due to limited experimental data and the inherent difficulty that comes from the resource-intensive and complex methodologies needed in assessing toxicity for these organs [<xref ref-type="bibr" rid="ref87">87</xref>,<xref ref-type="bibr" rid="ref88">88</xref>].</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Organ systems and toxicity endpoints evaluated in the included studies.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Category and subcategory</td><td align="left" valign="top">Studies, n</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="2">Organ</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Heart</td><td align="char" char="." valign="top">6</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Liver</td><td align="char" char="." valign="top">4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Bone</td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Skin</td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Eye</td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other</td><td align="char" char="." valign="top">5</td></tr><tr><td align="left" valign="top" colspan="2">Endpoint</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cardiotoxicity</td><td align="char" char="." valign="top">7</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hepatotoxicity</td><td align="char" char="." valign="top">4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Carcinogenicity</td><td align="char" char="." valign="top">3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Median lethal dose</td><td align="char" char="." valign="top">3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Peptide toxicity</td><td align="char" char="." valign="top">3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mutagenicity</td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Osteotoxicity</td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Skin reaction</td><td align="char" char="." valign="top">2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other</td><td align="char" char="." valign="top">7</td></tr></tbody></table></table-wrap><p>Of the many toxicity endpoints that different groups have tried to develop models for, the prediction of cardiotoxicity [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref48">48</xref>] and drug-induced liver injury [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref46">46</xref>] are particularly well-represented in the literature (<xref ref-type="table" rid="table4">Table 4</xref>), reflecting their clinical significance and data availability for these toxicity endpoints. Models able to provide such predictions can serve as a filter to identify potentially harmful drugs in the premarket stage and reduce the failure risk in the later drug development stages.</p></sec><sec id="s3-5"><title>What Types of LMs Have Been Used to Analyze Safety Risks in Drug Design and Development?</title><p>Assessment of LM use over time reveals a clear evolution in methodological choices (<xref ref-type="fig" rid="figure4">Figure 4A</xref>). Until 2018, all studies relied exclusively on static LMs [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref71">71</xref>]. Between 2019 and 2022, a more balanced use of static and contextualized LMs was observed, reflecting a transitional phase toward context-aware representations [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref64">64</xref>]. From 2023 onward, more advanced architectures emerged, with the introduction of encoder-decoder models and LLMs [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref63">63</xref>], which rapidly gained prominence, accounting for approximately half of the studies included by 2025. Notably, no publication from 2024 used encoder-decoder models or LLMs. This pattern may be because most of the papers published in 2024 that we included in our review [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref46">46</xref>] were preclinical studies, which primarily rely on discriminative models rather than more recent generative LMs. However, stochastic variation in publication trends cannot be excluded.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Artificial intelligence algorithms used for safety risk assessment in pharmaceutical research and development. (A) Studies published per year from 2015 to 2025, grouped by LM type: static, contextualized, encoder-decoder, and large. (B) Distribution of studies across different LM architectures. (C) Studies stratified by LM architecture type: discriminative, encoder-decoder, and generative. (D) Classical machine learning and deep learning approaches. BART: bidirectional and auto-regressive transformer; BERT: bidirectional encoder representations from transformers; CNN: convolutional neural network; CRF: conditional random field; ELECTRA: efficiently learning an encoder that classifies token replacements accurately; GBoost: (extreme) gradient boosting; GNN: graph neural network; kNN: k-nearest neighbors; LM: language model; LR: logistic regression; NodeEmb: node embedding; RF: random forest; RNN: recurrent neural network; SVM: support vector machine; Tree: decision tree.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v5i1e77732_fig04.png"/></fig><p>Further analysis of the LMs used across the included studies shows that the majority relied on the bidirectional encoder representations from transformers (BERT) architecture (n=24; <xref ref-type="fig" rid="figure4">Figure 4B</xref>) [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref77">77</xref>]. This predominance is consistent with the architectural design of BERT as an encoder-only, bidirectional model, which is particularly well-suited for generating high-quality contextualized embeddings for downstream tasks such as classification, similarity analysis, and information retrieval. In contrast, large generative models such as GPT-4 or LLaMA are primarily optimized for autoregressive text generation rather than embedding extraction, making BERT-based models generally more precise and computationally efficient for representation learning purposes. The word2vec model (n=13) was the second most frequently used [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref64">64</xref>-<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref71">71</xref>], followed by more recent approaches, such as RoBERTa (n=7) [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref75">75</xref>] and GPT (n=6) [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref76">76</xref>] architectures. A substantial proportion of studies using these models was conducted for safety risk assessment in postmarket settings. This predominance of postmarket applications can be explained by the fact that the tasks most related to this phase, that is, information extraction and document classification (<xref ref-type="fig" rid="figure2">Figure 2B</xref>), rely extensively on natural language processing. In contrast, the use of LMs, such as ChemBERTa, especially for molecular representations in premarket studies, is a more recent adaptation of language modeling to other data modalities.</p><p>If we look at the model architectures across the included studies (<xref ref-type="fig" rid="figure4">Figure 4C</xref>), we see a clear predominance of discriminative approaches (n=44), that is, LMs that focus on learning the boundaries between different tokens in a corpus, such as BERT [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref75">75</xref>], word2vec [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref64">64</xref>], and XLNet [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. These models are used for tasks such as NER and RE, as well as toxicity and ADE prediction [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref70">70</xref>-<xref ref-type="bibr" rid="ref73">73</xref>]. Discriminative models, often implemented as fine-tuned, encoder-based transformer architectures, are particularly well-suited to these objectives, as they are optimized for classification and sequence labeling tasks that rely on well-defined input-output mappings. In contrast, studies leveraging generative LMs, that is, models that generate text by predicting the next token based on preceding context, focus on NER [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref76">76</xref>] (n=6), benefiting from the zero-shot learning (ie, without annotated data) capabilities of those models. As seen from <xref ref-type="fig" rid="figure4">Figure 4A</xref>, the use of these models has significantly increased in the last year of the survey, benefiting from the recent progress made in LLMs.</p><p>LLM-based models are often used in combination with classical ML (n=4) [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref68">68</xref>] and deep learning (DL) models (n=31) [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]. Among the ML and DL models used in parallel or in combination with LLMs, support vector machines (SVMs) are the most prevalent (n=13) [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref71">71</xref>], followed by graph neural networks (GNNs; n=12) [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref76">76</xref>], then recurrent neural networks (RNNs; n=10) [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref65">65</xref>], with convolutional neural networks (CNNs; n=8) [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref74">74</xref>] used at a comparable frequency to conditional random fields (CRFs; n=8) [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref64">64</xref>-<xref ref-type="bibr" rid="ref66">66</xref>]. Overall, SVM and CRF are the most used among classical ML approaches, whereas GNNs, RNNs, and CNNs are predominant among DL methods. In addition, across the reviewed studies, GNNs are primarily used for molecular representations [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref51">51</xref>], whereas SVMs, RNNs, CNNs, and CRFs are mainly used for both molecular representation [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref46">46</xref>-<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref50">50</xref>] and clinical text data [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref68">68</xref>].</p></sec><sec id="s3-6"><title>What Are the Data Sources and Metrics Used for Training and Evaluating LM Methods for Safety Assessment in Pharma R&#x0026;D?</title><p>AI-based safety assessment studies in Pharma R&#x0026;D leverage diverse structured and unstructured data sources for safety prediction and ADE detection (<xref ref-type="table" rid="table5">Table 5</xref>). Premarket studies focusing on molecular representations primarily rely on curated chemical and pharmacological datasets, with SIDER (n=6) [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref48">48</xref>-<xref ref-type="bibr" rid="ref50">50</xref>] and ClinTox (n=3) [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref45">45</xref>] being the most frequently used resources, reflecting their central role in modeling toxicity and drug-ADE associations. Knowledge bases such as DrugBank, ChEMBL, and PubChem further complement these analyses by providing chemical and biological context.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Main datasets used by dataset type and study data focus.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Dataset</td><td align="left" valign="bottom">Dataset type</td><td align="left" valign="bottom" colspan="5">Study data focus</td><td align="left" valign="bottom">All</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom"/><td align="left" valign="bottom">Molecular representation</td><td align="left" valign="bottom">Social media</td><td align="left" valign="bottom">Clinical text</td><td align="left" valign="bottom">Scientific literature</td><td align="left" valign="bottom">Incident reports</td><td align="left" valign="bottom"/></tr></thead><tbody><tr><td align="left" valign="top">SIDER [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref48">48</xref>-<xref ref-type="bibr" rid="ref50">50</xref>]</td><td align="left" valign="top">ADE<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup>-specific knowledge resources</td><td align="left" valign="top">6</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">8</td></tr><tr><td align="left" valign="top">ClinTox [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td><td align="left" valign="top">ADE-specific knowledge resources</td><td align="left" valign="top">3</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">3</td></tr><tr><td align="left" valign="top">ATSE [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]</td><td align="left" valign="top">ADE-specific knowledge resources</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">CTD [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]</td><td align="left" valign="top">ADE-specific knowledge resources</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">DILI<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup> [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]</td><td align="left" valign="top">ADE-specific knowledge resources</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">ToxinPred2 [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]</td><td align="left" valign="top">ADE-specific knowledge resources</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">CT-ADE [<xref ref-type="bibr" rid="ref25">25</xref>]</td><td align="left" valign="top">ADE-specific knowledge resources</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">SMM4H (Twitter) [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]</td><td align="left" valign="top">Social media&#x2013;annotated datasets</td><td align="left" valign="top">0</td><td align="left" valign="top">8</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">8</td></tr><tr><td align="left" valign="top">CADEC (patient forum) [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]</td><td align="left" valign="top">Social media&#x2013;annotated datasets</td><td align="left" valign="top">0</td><td align="left" valign="top">5</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">5</td></tr><tr><td align="left" valign="top">Twitter [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref74">74</xref>]</td><td align="left" valign="top">Social media&#x2013;annotated datasets</td><td align="left" valign="top">0</td><td align="left" valign="top">4</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">4</td></tr><tr><td align="left" valign="top">Patient forum [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref61">61</xref>]</td><td align="left" valign="top">Social media&#x2013;annotated datasets</td><td align="left" valign="top">0</td><td align="left" valign="top">3</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">3</td></tr><tr><td align="left" valign="top">ADHD (Twitter) [<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref71">71</xref>]</td><td align="left" valign="top">Social media&#x2013;annotated datasets</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">PsyTAR (patient forum) [<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]</td><td align="left" valign="top">Social media&#x2013;annotated datasets</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">Reddit [<xref ref-type="bibr" rid="ref39">39</xref>]</td><td align="left" valign="top">Social media&#x2013;annotated datasets</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">DailyStrength (patient forum) [<xref ref-type="bibr" rid="ref29">29</xref>]</td><td align="left" valign="top">Social media&#x2013;annotated datasets</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">EHR (private) [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref72">72</xref>]</td><td align="left" valign="top">Annotated clinical reports</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">5</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">5</td></tr><tr><td align="left" valign="top">MADE (EHR) [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref58">58</xref>]</td><td align="left" valign="top">Annotated clinical reports</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">n2c2 (EHR) [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]</td><td align="left" valign="top">Annotated clinical reports</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">ClinicalTrials.gov [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td><td align="left" valign="top">Annotated scientific literature</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">3</td></tr><tr><td align="left" valign="top">PubMed or MEDLINE [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref70">70</xref>]</td><td align="left" valign="top">Annotated scientific literature</td><td align="left" valign="top">1</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">4</td></tr><tr><td align="left" valign="top">TAC [<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]</td><td align="left" valign="top">Annotated scientific literature</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">ADE-corpus-v2 (PubMed) [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref73">73</xref>]</td><td align="left" valign="top">Annotated scientific literature</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">3</td></tr><tr><td align="left" valign="top">FAERS<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup> [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref61">61</xref>]</td><td align="left" valign="top">Incident report systems</td><td align="left" valign="top">3</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">7</td></tr><tr><td align="left" valign="top">EU-ADR [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref49">49</xref>]</td><td align="left" valign="top">Incident report systems</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">ANSM [<xref ref-type="bibr" rid="ref75">75</xref>]</td><td align="left" valign="top">Incident report systems</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">FDA [<xref ref-type="bibr" rid="ref37">37</xref>]</td><td align="left" valign="top">Incident report systems</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">Health Canada [<xref ref-type="bibr" rid="ref37">37</xref>]</td><td align="left" valign="top">Incident report systems</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">Jiangsu ADR Mon. Center [<xref ref-type="bibr" rid="ref64">64</xref>]</td><td align="left" valign="top">Incident report systems</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">KAERS [<xref ref-type="bibr" rid="ref62">62</xref>]</td><td align="left" valign="top">Incident report systems</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">DrugBank [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]</td><td align="left" valign="top">Knowledge base, biomedical terminologies, and databases</td><td align="left" valign="top">7</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">10</td></tr><tr><td align="left" valign="top">ChEMBL [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]</td><td align="left" valign="top">Knowledge base, biomedical terminologies, and databases</td><td align="left" valign="top">5</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">7</td></tr><tr><td align="left" valign="top">PubChem [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]</td><td align="left" valign="top">Knowledge base, biomedical terminologies, and databases</td><td align="left" valign="top">3</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">4</td></tr><tr><td align="left" valign="top">UniProt [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]</td><td align="left" valign="top">Knowledge base, biomedical terminologies, and databases</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">ZINC [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>]</td><td align="left" valign="top">Knowledge base, biomedical terminologies, and databases</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">MedDRA<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup> [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref62">62</xref>]</td><td align="left" valign="top">Knowledge base, biomedical terminologies, and databases</td><td align="left" valign="top">1</td><td align="left" valign="top">4</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">2</td><td align="left" valign="top">9</td></tr><tr><td align="left" valign="top">OMOP [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref49">49</xref>]</td><td align="left" valign="top">Knowledge base, biomedical terminologies, and databases</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">3</td></tr><tr><td align="left" valign="top">UMLS [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref61">61</xref>]</td><td align="left" valign="top">Knowledge base, biomedical terminologies, and databases</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">3</td></tr><tr><td align="left" valign="top">ATC<sup><xref ref-type="table-fn" rid="table5fn5">e</xref></sup> [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]</td><td align="left" valign="top">Knowledge base, biomedical terminologies, and databases</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>ADE: adverse drug event.</p></fn><fn id="table5fn2"><p><sup>b</sup>DILI: drug-induced liver injury.</p></fn><fn id="table5fn3"><p><sup>c</sup>FAERS: FDA Adverse Event Reporting System Database.</p></fn><fn id="table5fn4"><p><sup>d</sup>MedDRA: Medical Dictionary for Regulatory Activities.</p></fn><fn id="table5fn5"><p><sup>e</sup>ATC: Anatomical Therapeutic Chemical.</p></fn></table-wrap-foot></table-wrap><p>Postmarket safety monitoring predominantly exploits real-world data, including social media, clinical text, and reporting systems. Twitter-based datasets from SMM4H (n=8) [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref76">76</xref>] and CADEC (n=5) [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref76">76</xref>] are widely used to capture patient-reported ADEs and enable near real-time signal detection. Clinical text-based studies mainly rely on annotated EHRs (n=5) [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref72">72</xref>], as well as MADE and n2c2 datasets, to support supervised ADE extraction. Across all data focuses, scientific literature sources (eg, ClinicalTrials.gov and PubMed or MEDLINE) [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref70">70</xref>] and spontaneous reporting systems such as the FDA Adverse Event Reporting System Database (FAERS) [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref61">61</xref>] provide complementary evidence for large-scale pharmacovigilance analyses.</p><p>As shown in <xref ref-type="fig" rid="figure5">Figure 5A</xref>, distinct methodological trends can be observed with respect to the targeted tasks across the different data focus categories, namely, molecular representation, social media, clinical text, scientific literature, and incident reports. Studies relying on molecular representations predominantly focus on toxicity prediction [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref77">77</xref>], reflecting their emphasis on molecular structure features for safety risk assessment. In contrast, studies leveraging social media, clinical text, scientific literature, and incident reports primarily address NER [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref65">65</xref>], as these data sources consist largely of unstructured text for which entity identification is a foundational step. Within these text-based domains, social media&#x2013;based studies also place a strong emphasis on EL, aiming to normalize patient-reported mentions of drugs and ADEs to standardized vocabularies [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref61">61</xref>]. Clinical text-focused studies, on the other hand, more frequently target RE as the additional task [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref68">68</xref>], seeking to identify explicit associations between drugs and ADEs within clinical narratives. Studies based on incident reports exhibit a broader task spectrum, commonly integrating NER, EL, and RE [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref64">64</xref>], in addition to document classification [<xref ref-type="bibr" rid="ref37">37</xref>] and signal detection [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref39">39</xref>], to facilitate triage and fully exploit structured reporting formats for pharmacovigilance signal detection, enabling a comprehensive pharmacovigilance analysis.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Overview of data sources and evaluation metrics used for training and validation, including data focus by task type, evaluation metrics, dataset language, and dataset accessibility. (<bold>A</bold>) Number of studies by data focus category stratified by task type. (<bold>B</bold>) Number of studies by evaluation metrics. (<bold>C</bold>) Distribution of studies by dataset language. (<bold>D</bold>) Number of studies by dataset accessibility: public versus private. ADE: adverse drug event; AUPRC: area under the precision-recall curve; AUROC: area under the receiver operating characteristic curve; EN: English; FR: French; KR: Korean; MCC: Matthews correlation coefficient; NER: named entity recognition; PRR: proportional reporting ratio; ROR: reporting odds ratio; RU: Russian; ZH: Chinese.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v5i1e77732_fig05.png"/></fig><p>With respect to the evaluation metrics (<xref ref-type="fig" rid="figure5">Figure 5B</xref>) used, clear differences emerge between premarket and postmarket evaluation practices. Metrics such as the <italic>F</italic><sub>1</sub>-score, sensitivity (recall), and precision are most frequently reported overall, largely due to their extensive use in postmarket studies [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref74">74</xref>]. In contrast, evaluation metrics, including the area under the receiver operating characteristic curve (AUROC), Matthews correlation coefficient, accuracy, specificity, and balanced accuracy, are predominantly used to assess premarket studies [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref77">77</xref>]. Certain metrics, notably the reporting odds ratio and proportional reporting ratio, are exclusively used in postmarket settings for statistical signal detection [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref39">39</xref>].</p><p>Most of the reviewed papers use English datasets (n=28) [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref70">70</xref>] and publicly available data (n=38) [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref46">46</xref>-<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref73">73</xref>] (<xref ref-type="fig" rid="figure5">Figure 5D</xref>), reflecting the widespread use of open premarketing chemical and postmarketing pharmacological databases in this domain [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref77">77</xref>]. A minority of papers analyze other European languages, such as French (n=2) [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref75">75</xref>] and Swedish (n=2) [<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref67">67</xref>], and Asian languages, such as Korean (n=1) [<xref ref-type="bibr" rid="ref62">62</xref>] and Chinese (n=1) [<xref ref-type="bibr" rid="ref64">64</xref>]. In contrast, studies focusing on clinical text are proportionally more likely to rely on private data sources [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref72">72</xref>], highlighting the restricted access associated with clinical records and institutional electronic health data.</p><p>Regarding the features used for different tasks (<xref ref-type="table" rid="table6">Table 6</xref>), word embeddings and molecular embeddings are the most used. Word embeddings are predominantly used for NER (n=23) [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref63">63</xref>-<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref76">76</xref>] but are also applied across most other tasks [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref68">68</xref>-<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref75">75</xref>], except for toxicity prediction. In this case, LMs are primarily for feature engineering, converting natural language symbols into dense representations. Toxicity prediction tasks, which are mainly addressed in premarket studies, rely primarily on molecular embedding features (n=10) [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref48">48</xref>], derived using LMs (molecular or protein LMs to be specific). N-gram features rank third in terms of use frequency and are used to a lesser extent than embeddings, often as complementary features. As with word embeddings, n-grams are not used for toxicity prediction, further highlighting the task&#x2019;s reliance on structured molecular representations rather than textual features.</p><table-wrap id="t6" position="float"><label>Table 6.</label><caption><p>Main features used in the analyzed studies across the different tasks.</p></caption><table id="table6" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Features</td><td align="left" valign="bottom">NER<sup><xref ref-type="table-fn" rid="table6fn1">a</xref></sup></td><td align="left" valign="bottom">Toxicity prediction</td><td align="left" valign="bottom">ADE<sup><xref ref-type="table-fn" rid="table6fn2">b</xref></sup> detection</td><td align="left" valign="bottom">RE<sup><xref ref-type="table-fn" rid="table6fn3">c</xref></sup></td><td align="left" valign="bottom">Signal detection</td><td align="left" valign="bottom">ADE seriousness</td><td align="left" valign="bottom">EL<sup><xref ref-type="table-fn" rid="table6fn4">d</xref></sup></td><td align="left" valign="bottom">ADE prediction</td><td align="left" valign="bottom">ADE summary</td></tr></thead><tbody><tr><td align="left" valign="top">Word embedding</td><td align="left" valign="top">23</td><td align="left" valign="top">0</td><td align="left" valign="top">6</td><td align="left" valign="top">7</td><td align="left" valign="top">5</td><td align="left" valign="top">3</td><td align="left" valign="top">5</td><td align="left" valign="top">2</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top">molecular embedding</td><td align="left" valign="top">0</td><td align="left" valign="top">10</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">n-gram</td><td align="left" valign="top">4</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">2</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">TF-IDF<sup><xref ref-type="table-fn" rid="table6fn5">e</xref></sup></td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">3</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Molecular property</td><td align="left" valign="top">0</td><td align="left" valign="top">3</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Lexicon</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Molecular fingerprint</td><td align="left" valign="top">0</td><td align="left" valign="top">4</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Categorical</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Molecular descriptor</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Node embedding</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Protein embedding</td><td align="left" valign="top">0</td><td align="left" valign="top">2</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Sentence embedding</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr></tbody></table><table-wrap-foot><fn id="table6fn1"><p><sup>a</sup>NER: named entity recognition. </p></fn><fn id="table6fn2"><p><sup>b</sup>ADE: adverse drug event.</p></fn><fn id="table6fn3"><p><sup>c</sup>RE: relation extraction. </p></fn><fn id="table6fn4"><p><sup>d</sup>EL: entity linking.</p></fn><fn id="table6fn5"><p><sup>e</sup>TF-IDF: term frequency-inverse document frequency.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-7"><title>What Are the Current Limitations of LM Approaches for AI-Based ADE Analysis?</title><p>Despite rapid methodological progress, the reviewed literature reveals that there are several persistent limitations that constrain the reliability, generalizability, and practical utility of LM-based methods for safety prediction and detection across the drug development lifecycle.</p><p>Many studies rely on English-language corpora [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref60">60</xref>], spanning social media benchmarks, patient forums, and biomedical literature, as well as many publicly available ADE corpora used in modeling pipelines. This creates a bias, whereby models trained and evaluated primarily on English might underperform when deployed on non-English narratives, where lexical variation or different naming conventions could alter information extraction performance. Beyond language, geographic bias [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref64">64</xref>] could emerge because prescribing patterns or drug availability vary across health care systems. Models trained on US data sources may not be applicable in other jurisdictions without adaptation.</p><p>Although many postmarket studies extract ADE mentions or compute signals from real-world sources, none validate downstream findings against established postmarketing evidence. For example, several studies have extracted and normalized ADE from social media [<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref65">65</xref>]. However, none of them report how these findings compare with ADEs validated in phase IV clinical trials. Without robust external validation, it remains difficult to quantify the proportion of signals representing actionable findings rather than noise. ADE detection in postmarket settings is often framed as information extraction, primarily NER [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref73">73</xref>] and RE [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref68">68</xref>], to structure what is stated in narratives. The goal of these systems is not to establish biomedical causality. Instead, they aim to identify causal attributions as expressed by the author, whether clinician or patient, and to make that information usable for downstream pharmacovigilance workflows. However, translating extracted attributions into actionable safety assessments requires further analysis. Real-world safety evaluation must account for factors such as confounding by indication and differences in target populations. This is essential because the likelihood and severity of ADEs are context-dependent and can vary with determinants such as underlying disease, dose, and treatment duration. This contextuality also highlights a key limitation of many premarket resources and toxicity prediction pipelines. These resources and pipelines often rely on decontextualized representations of compounds and therefore miss patient- and regimen-specific determinants that shape how adverse outcomes manifest in practice.</p><p>Across studies, evaluation most commonly centers on <italic>F</italic><sub>1</sub>-score [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref48">48</xref>], precision or recall [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref75">75</xref>], and AUROC [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]. In premarket safety prediction studies, AUROC and accuracy are predominant. While these are useful metrics, they should be interpreted with caution in the presence of class imbalance, which is common in toxicity and ADE datasets. In such settings, AUROC or accuracy may mask poor performance on rare but safety-critical events and should therefore be reported alongside more robust metrics such as balanced accuracy, Matthews correlation coefficient, and <italic>F</italic><sub>1</sub>-score. Moreover, calibration is rarely assessed, despite being essential when model outputs are used to rank safety risks or trigger alerts. A model can achieve strong discrimination while producing poorly calibrated probabilities, which can lead to inappropriate decision thresholds and misinterpretation of predicted risk. In addition, the literature remains skewed toward postmarket detection, with comparatively few LM applications that integrate into early development decisions. This imbalance restricts the ability of LM methods to support proactive risk mitigation, where earlier detection could reduce attrition and patient harm.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>AI, and LMs in particular, is increasingly influencing how ADEs are anticipated and monitored throughout the drug development lifecycle. The recent acceleration in this field is not simply a result of wider adoption of AI. It also reflects a methodological consolidation where LMs provide a common framework for learning from molecular structure [<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref43">43</xref>] and human-generated text [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref63">63</xref>]. By mapping LM applications from premarket pharmaceutical research through postmarket safety monitoring, this scoping review captures an evolution from static embedding methods [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref66">66</xref>] toward contextualized transformer encoders [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref72">72</xref>] and, more recently, LLMs [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref63">63</xref>].</p><p>Across the 49 studies included in this review, which were published between 2015 and October 15, 2025, LM-based applications are more strongly represented in postmarket ADE detection (n=33) than in premarket safety prediction (n=16). Postmarket studies typically implement pharmacovigilance as information extraction tasks, including NER, RE, EL [<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref66">66</xref>], and document-level classification [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref74">74</xref>], tasks for which LMs are naturally designed. In contrast, premarket studies most often frame safety as a predictive modeling problem over compound representations, in which LMs act as feature learners that enable toxicity prediction [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref46">46</xref>] before synthesis, extensive preclinical testing, or clinical evaluation. Taken together, these 2 aspects illustrate how LMs function as a bridging technology throughout the process by standardizing representation learning across data modalities and enabling safety assessment within a unified methodological family.</p><p>With respect to the safety outcomes addressed, organ-specific prediction remains focused on a limited set of endpoints that are both clinically relevant and well supported by the available training data. Heart and liver toxicities predominate among organ-targeted studies, and accordingly, cardiotoxicity and hepatotoxicity emerge as the most modeled endpoints [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. Conversely, less frequently modeled organs, such as the brain [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref48">48</xref>], experience a scarcity of high-quality labeled datasets and the experimental complexity required to generate ground truth for these tissues. As a result, methodological progress is currently strongest, where data availability is favorable, while important gaps persist for rarer, complex, or difficult-to-measure toxicities.</p></sec><sec id="s4-2"><title>Comparison to Prior Work</title><p>The included literature shows a clear methodological progression from static representations in earlier years to contextualized encoders and, more recently, to the recent emergence of LLMs. Despite increased attention to generative systems, most of the included studies remain centered on discriminative, encoder-based architectures, aligning with the predominance of supervised extraction and classification tasks. BERT-family models are the most frequently used contextualized architectures [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref76">76</xref>], while word2vec remains common [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref61">61</xref>], often within hybrid pipelines that combine learned embeddings with classical ML or DL classifiers [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref71">71</xref>]. The continuing dominance of discriminative approaches is consistent with their comparatively lower computational requirements and stable supervised training behavior, as well as the availability of annotated datasets suited for supervised learning [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref72">72</xref>]. Furthermore, the pharmaceutical industry&#x2019;s regulatory framework favors deterministic reliability over generative flexibility. While LLMs offer powerful zero-shot capabilities, their propensity for hallucination poses a safety risk in pharmacovigilance, where a fabricated ADE signal is as dangerous as a missed one. The future dominance of LLMs will likely depend less on their generative fluency and more on the development of guardrails and grounding mechanisms that can satisfy regulatory rigor.</p><p>At the same time, the increasing appearance of LLMs, particularly in the most recent portion of the review period, suggests a shift toward approaches that can exploit zero-shot or few-shot capabilities, which could reduce dependence on costly annotation. In the reviewed evidence, however, this generative turn is most represented in postmarket extraction settings rather than spanning the full drug development lifecycle uniformly.</p></sec><sec id="s4-3"><title>Future Directions</title><p>The data ecosystems underlying pre- and postmarket applications differ systematically. Premarket prediction studies largely rely on curated chemical and toxicity resources (eg, SIDER, ClinTox, and CTD) [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref49">49</xref>] and are frequently complemented by established knowledge bases providing chemical and biological context (eg, DrugBank, ChEMBL, and PubChem) [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]. Postmarket detection studies predominantly leverage real-world narrative sources, including social media benchmarks (eg, SMM4H and CADEC) [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref76">76</xref>] and clinical text resources (eg, private EHR datasets, MADE, and n2c2) [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref72">72</xref>]. These differences in the data are mirrored in the evaluation practices, with postmarket studies typically reporting precision, recall, and <italic>F</italic><sub>1</sub>-scores [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref62">62</xref>], whereas premarket studies more frequently emphasize AUROC and accuracy [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref77">77</xref>]. While such metric choices are conventional for the respective task families, they complicate comparisons across pipeline stages and can obscure safety-relevant weaknesses. High entity-level <italic>F</italic><sub>1</sub>, for example, does not necessarily translate into reliable pharmacovigilance decisions unless downstream signal utility is demonstrated. Similarly, AUROC and accuracy can remain favorable under class imbalance, potentially masking poor performance on rare but clinically significant events. Consequently, the field experiences a metric-utility misalignment. In safety surveillance, the cost of a false negative (missing a fatal ADE) vastly outweighs the cost of a false positive (unnecessary review). Yet, many reviewed studies optimize for balanced metrics like <italic>F</italic><sub>1</sub>-score rather than prioritizing high-sensitivity configurations (recall&#x003E;95%) that act as effective safety nets. Future benchmarks must penalize missed (serious) signals more heavily to reflect the operational realities of drug safety.</p><p>Beyond evaluation metrics, the reviewed literature reveals several recurring limitations. Linguistic and geographic bias in training data remains common. Downstream validation is often limited, and extracted ADE information is rarely leveraged in deeper analyses, while calibration is also infrequently assessed. Together, these issues constrain the generalizability and practical utility of LM-based pharmacovigilance systems. LM-based methods are appealing because they can support safety analyses across the drug development lifecycle while preserving existing practices. However, their value proposition depends on moving beyond isolated tasks toward demonstrable gains in workflow efficiency and patient safety.</p><p>Taken together, the evidence indicates that LM-based methods have evolved from representation learning into a diverse toolkit supporting both premarket safety prediction and postmarket ADE detection. While the field remains anchored in discriminative transformers and supervised training, generative LLMs are emerging as a complementary paradigm that could accelerate adaptation thanks to their zero-shot capabilities. Future progress is likely to depend strongly on robust generalizability and downstream validation. Moreover, there is a clear need for greater methodological convergence between chemical LMs and text-based LMs, particularly through multimodal approaches that incorporate chemical-, patient-, and regimen-level information. Currently, the bridge provided by LMs is methodological rather than functional; premarket models do not learn from postmarket text, and vice versa. A true paradigm shift will occur only when multimodal architectures are trained jointly on molecular structures and safety-related narratives. This would allow a model to analyze a chemical structure and directly generate its potential postmarket safety profile, effectively closing the feedback loop that currently takes years to traverse [<xref ref-type="bibr" rid="ref23">23</xref>]. In the context of safety prediction, such efforts would help bridge the gap between decontextualized, compound-centric predictions and the context-dependent determinants of ADE risk in real-world scenarios. This suggests that the performance ceiling in toxicity prediction is not algorithmic, but conceptual. By modeling molecules as isolated static entities, current LMs ignore the physiological context (eg, metabolism and genetics) that defines toxicity. Future breakthroughs will require moving from molecule-centric LMs to interaction-centric systems that embed compounds within virtual biological environments.</p></sec><sec id="s4-4"><title>Strengths and Limitations</title><p>This review has several limitations. First, the scope was deliberately narrowed to studies that explicitly use LM techniques. While this keeps the research questions we posed tractable, it inevitably underrepresents the large body of preclinical safety work that still relies on nonlinguistic DL (eg, pure graph or image models) and may therefore give the impression that the use of LMs is more mature than it really is [<xref ref-type="bibr" rid="ref18">18</xref>], or that it is the only approach to apply AI for drug safety. Another limitation lies in the fact that almost all of the papers ultimately included analyze English corpora, with only a handful making use of non-English corpora. This linguistic bias, reinforced by the exclusion of non-English papers, already criticized in earlier pharmacovigilance reviews [<xref ref-type="bibr" rid="ref16">16</xref>], limits the study&#x2019;s external validity in markets where social media posts in languages, such as Spanish, Portuguese, Hindi, and Arabic, dominate. This mirrors the selection bias that Chekroud et al [<xref ref-type="bibr" rid="ref89">89</xref>] have highlighted for efficacy prediction using clinical trials and probably inflates the apparent dominance of English-language, Twitter-based, postmarketing studies. From a methodological point of view, our search strings were compiled using high-level terms (eg, &#x201C;language model&#x201D;) and will have missed papers that mention only specific algorithms (eg, &#x201C;ELMo&#x201D; and &#x201C;BERT&#x201D;) without the umbrella &#x201C;LM&#x201D; label.</p></sec><sec id="s4-5"><title>Conclusions</title><p>While the application of LMs to ADE analysis in pharmaceutical research and development is still in its early stages, this scoping review highlights the field&#x2019;s rapid maturation and considerable potential. Our findings demonstrate that LMs can be integrated across various stages of the drug development lifecycle, from early toxicity prediction in the premarket phase to large-scale ADE detection in postmarket surveillance.</p><p>The reviewed studies indicate that recent advances in contextualized LMs and LLMs have led to meaningful improvements in the extraction, representation, and analysis of safety-related information from both molecular and textual data sources. As these methodologies continue to evolve, they show great promise in enhancing drug safety assessment, improving the efficiency of pharmacovigilance systems, and ultimately reducing preventable patient harm and health care costs.</p><p>Looking ahead, broader adoption of LLM-based approaches will depend on continued progress in model validation, interpretability, and integration into real-world regulatory and clinical workflows. With sustained methodological refinement and closer alignment with pharmacovigilance practice, LMs are well-positioned to play a transformative role in future drug safety monitoring and decision-making, thereby fostering greater trust and acceptance in therapeutic and regulatory settings.</p></sec></sec></body><back><notes><sec><title>Funding</title><p>This work was funded by the Innosuisse (project: 114.721 IP-ICT) and Swiss National Science Foundation (grant 10005385).</p></sec><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>DT conceptualized the study, defined the methodology, and coordinated the research process. AY, OS, and DT performed the database searches and coordinated the screening process. IG, AY, OS, RK, and DT extracted item information from full texts. IG, AY, and DT performed the data analysis. OS, IG, AY, and DT authored the original draft. All authors reviewed and approved the manuscript.</p></fn><fn fn-type="conflict"><p>At the time of the submission, RK and GM are employees of Johnson &#x0026; Johnson and Cilag, respectively. The other authors declare no competing interests.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ADE</term><def><p>adverse drug event</p></def></def-item><def-item><term id="abb2">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb3">AUROC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb4">BERT</term><def><p>bidirectional encoder representations from transformer</p></def></def-item><def-item><term id="abb5">CHARMS</term><def><p>Critical Appraisal and Data Extraction for Systematic Reviews of Prediction Modeling Studies</p></def></def-item><def-item><term id="abb6">CNN</term><def><p>convolutional neural network</p></def></def-item><def-item><term id="abb7">CRF</term><def><p>conditional random field</p></def></def-item><def-item><term id="abb8">DL</term><def><p>deep learning</p></def></def-item><def-item><term id="abb9">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb10">EL</term><def><p>entity linking</p></def></def-item><def-item><term id="abb11">GNN</term><def><p>graph neural network</p></def></def-item><def-item><term id="abb12">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb13">LM</term><def><p>language model</p></def></def-item><def-item><term id="abb14">MedDRA</term><def><p>Medical Dictionary for Regulatory Activities</p></def></def-item><def-item><term id="abb15">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb16">NER</term><def><p>named entity recognition</p></def></def-item><def-item><term id="abb17">Pharma R&#x0026;D</term><def><p>pharmaceutical research and development</p></def></def-item><def-item><term id="abb18">PRISMA-ScR</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses Extension for Scoping Reviews</p></def></def-item><def-item><term id="abb19">RE</term><def><p>relation extraction</p></def></def-item><def-item><term id="abb20">RNN</term><def><p>recurrent neural network</p></def></def-item><def-item><term id="abb21">SVM</term><def><p>support vector machine</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hwang</surname><given-names>TJ</given-names> </name><name name-style="western"><surname>Carpenter</surname><given-names>D</given-names> </name><name name-style="western"><surname>Lauffenburger</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Franklin</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Kesselheim</surname><given-names>AS</given-names> </name></person-group><article-title>Failure of investigational drugs in late-stage clinical development and publication of trial results</article-title><source>JAMA Intern Med</source><year>2016</year><month>12</month><day>1</day><volume>176</volume><issue>12</issue><fpage>1826</fpage><lpage>1833</lpage><pub-id pub-id-type="doi">10.1001/jamainternmed.2016.6008</pub-id><pub-id pub-id-type="medline">27723879</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shehab</surname><given-names>N</given-names> </name><name name-style="western"><surname>Lovegrove</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Geller</surname><given-names>AI</given-names> </name><name name-style="western"><surname>Rose</surname><given-names>KO</given-names> </name><name name-style="western"><surname>Weidle</surname><given-names>NJ</given-names> </name><name name-style="western"><surname>Budnitz</surname><given-names>DS</given-names> </name></person-group><article-title>US Emergency Department visits for outpatient adverse drug events, 2013-2014</article-title><source>JAMA</source><year>2016</year><month>11</month><day>22</day><volume>316</volume><issue>20</issue><fpage>2115</fpage><lpage>2125</lpage><pub-id pub-id-type="doi">10.1001/jama.2016.16201</pub-id><pub-id pub-id-type="medline">27893129</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Narayanan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mannam</surname><given-names>K</given-names> </name><name name-style="western"><surname>Achan</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ramesh</surname><given-names>MV</given-names> </name><name name-style="western"><surname>Rangan</surname><given-names>PV</given-names> </name><name name-style="western"><surname>Rajan</surname><given-names>SP</given-names> </name></person-group><article-title>A contextual multi-task neural approach to medication and adverse events identification from clinical text</article-title><source>J Biomed Inform</source><year>2022</year><month>01</month><volume>125</volume><fpage>103960</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2021.103960</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vo</surname><given-names>AH</given-names> </name><name name-style="western"><surname>Van Vleet</surname><given-names>TR</given-names> </name><name name-style="western"><surname>Gupta</surname><given-names>RR</given-names> </name><name name-style="western"><surname>Liguori</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Rao</surname><given-names>MS</given-names> </name></person-group><article-title>An overview of machine learning and big data for drug toxicity evaluation</article-title><source>Chem Res Toxicol</source><year>2020</year><month>01</month><day>21</day><volume>33</volume><issue>1</issue><fpage>20</fpage><lpage>37</lpage><pub-id pub-id-type="doi">10.1021/acs.chemrestox.9b00227</pub-id><pub-id pub-id-type="medline">31625725</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yadesa</surname><given-names>TM</given-names> </name><name name-style="western"><surname>Kitutu</surname><given-names>FE</given-names> </name><name name-style="western"><surname>Deyno</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ogwang</surname><given-names>PE</given-names> </name><name name-style="western"><surname>Tamukong</surname><given-names>R</given-names> </name><name name-style="western"><surname>Alele</surname><given-names>PE</given-names> </name></person-group><article-title>Prevalence, characteristics and predicting risk factors of adverse drug reactions among hospitalized older adults: a systematic review and meta-analysis</article-title><source>SAGE Open Med</source><year>2021</year><volume>9</volume><fpage>20503121211039099</fpage><pub-id pub-id-type="doi">10.1177/20503121211039099</pub-id><pub-id pub-id-type="medline">34422271</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Giri</surname><given-names>S</given-names> </name><name name-style="western"><surname>Bader</surname><given-names>A</given-names> </name></person-group><article-title>A low-cost, high-quality new drug discovery process using patient-derived induced pluripotent stem cells</article-title><source>Drug Discov Today</source><year>2015</year><month>01</month><volume>20</volume><issue>1</issue><fpage>37</fpage><lpage>49</lpage><pub-id pub-id-type="doi">10.1016/j.drudis.2014.10.011</pub-id><pub-id pub-id-type="medline">25448756</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Morgan</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Elangbam</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Berens</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Use of animal models of human disease for nonclinical safety assessment of novel pharmaceuticals</article-title><source>Toxicol Pathol</source><year>2013</year><volume>41</volume><issue>3</issue><fpage>508</fpage><lpage>518</lpage><pub-id pub-id-type="doi">10.1177/0192623312457273</pub-id><pub-id pub-id-type="medline">22968286</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marti&#x0107;-Kehl</surname><given-names>MI</given-names> </name><name name-style="western"><surname>Schibli</surname><given-names>R</given-names> </name><name name-style="western"><surname>Schubiger</surname><given-names>PA</given-names> </name></person-group><article-title>Can animal data predict human outcome? Problems and pitfalls of translational animal research</article-title><source>Eur J Nucl Med Mol Imaging</source><year>2012</year><month>09</month><volume>39</volume><issue>9</issue><fpage>1492</fpage><lpage>1496</lpage><pub-id pub-id-type="doi">10.1007/s00259-012-2175-z</pub-id><pub-id pub-id-type="medline">22790876</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kanato</surname><given-names>K</given-names> </name><name name-style="western"><surname>Nakamura</surname><given-names>K</given-names> </name><name name-style="western"><surname>Saito</surname><given-names>I</given-names> </name><etal/></person-group><article-title>Treatment-related deaths (TRD) in investigator-initiated cancer cooperative group trials: from the datasets of 44 studies (4,964 patients) by the Japan Clinical Oncology Group (JCOG)</article-title><source>J Clin Oncol</source><year>2009</year><month>05</month><day>20</day><volume>27</volume><issue>15_suppl</issue><fpage>6632</fpage><lpage>6632</lpage><pub-id pub-id-type="doi">10.1200/jco.2009.27.15_suppl.6632</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hazell</surname><given-names>L</given-names> </name><name name-style="western"><surname>Shakir</surname><given-names>SAW</given-names> </name></person-group><article-title>Under-reporting of adverse drug reactions</article-title><source>Drug Saf</source><year>2006</year><volume>29</volume><issue>5</issue><fpage>385</fpage><lpage>396</lpage><pub-id pub-id-type="doi">10.2165/00002018-200629050-00003</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gahr</surname><given-names>M</given-names> </name><name name-style="western"><surname>Eller</surname><given-names>J</given-names> </name><name name-style="western"><surname>Connemann</surname><given-names>BJ</given-names> </name><name name-style="western"><surname>Sch&#x00F6;nfeldt-Lecuona</surname><given-names>C</given-names> </name></person-group><article-title>Underreporting of adverse drug reactions: results from a survey among physicians</article-title><source>Eur Psychiatr</source><year>2017</year><month>04</month><volume>41</volume><issue>S1</issue><fpage>S369</fpage><lpage>S369</lpage><pub-id pub-id-type="doi">10.1016/j.eurpsy.2017.02.377</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Yazdani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rouhizadeh</surname><given-names>H</given-names> </name><name name-style="western"><surname>Bornet</surname><given-names>A</given-names> </name><name name-style="western"><surname>Teodoro</surname><given-names>D</given-names> </name></person-group><article-title>CONORM: context-aware entity normalization for adverse drug event detection</article-title><comment>Preprint posted online on  Sep 26, 2023</comment><pub-id pub-id-type="doi">10.1101/2023.09.26.23296150</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lavertu</surname><given-names>A</given-names> </name><name name-style="western"><surname>Vora</surname><given-names>B</given-names> </name><name name-style="western"><surname>Giacomini</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Altman</surname><given-names>R</given-names> </name><name name-style="western"><surname>Rensi</surname><given-names>S</given-names> </name></person-group><article-title>A new era in pharmacovigilance: toward real-world data and digital monitoring</article-title><source>Clin Pharmacol Ther</source><year>2021</year><month>05</month><volume>109</volume><issue>5</issue><fpage>1197</fpage><lpage>1202</lpage><pub-id pub-id-type="doi">10.1002/cpt.2172</pub-id><pub-id pub-id-type="medline">33492663</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>De Abreu Ferreira</surname><given-names>R</given-names> </name><name name-style="western"><surname>Zhong</surname><given-names>S</given-names> </name><name name-style="western"><surname>Moureaud</surname><given-names>C</given-names> </name><etal/></person-group><article-title>A pilot, predictive surveillance model in pharmacovigilance using machine learning approaches</article-title><source>Adv Ther</source><year>2024</year><month>06</month><volume>41</volume><issue>6</issue><fpage>2435</fpage><lpage>2445</lpage><pub-id pub-id-type="doi">10.1007/s12325-024-02870-5</pub-id><pub-id pub-id-type="medline">38704799</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shool</surname><given-names>S</given-names> </name><name name-style="western"><surname>Adimi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Saboori Amleshi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bitaraf</surname><given-names>E</given-names> </name><name name-style="western"><surname>Golpira</surname><given-names>R</given-names> </name><name name-style="western"><surname>Tara</surname><given-names>M</given-names> </name></person-group><article-title>A systematic review of large language model (LLM) evaluations in clinical medicine</article-title><source>BMC Med Inform Decis Mak</source><year>2025</year><month>03</month><day>7</day><volume>25</volume><issue>1</issue><fpage>117</fpage><pub-id pub-id-type="doi">10.1186/s12911-025-02954-4</pub-id><pub-id pub-id-type="medline">40055694</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Syrowatka</surname><given-names>A</given-names> </name><name name-style="western"><surname>Song</surname><given-names>W</given-names> </name><name name-style="western"><surname>Amato</surname><given-names>MG</given-names> </name><etal/></person-group><article-title>Key use cases for artificial intelligence to reduce the frequency of adverse drug events: a scoping review</article-title><source>Lancet Digit Health</source><year>2022</year><month>02</month><volume>4</volume><issue>2</issue><fpage>e137</fpage><lpage>e148</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(21)00229-6</pub-id><pub-id pub-id-type="medline">34836823</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kar</surname><given-names>S</given-names> </name></person-group><article-title>Application of artificial intelligence and machine learning in early detection of adverse drug reactions (ADRs) and drug-induced toxicity</article-title><source>Artif Intell Chem</source><year>2023</year><month>12</month><volume>1</volume><issue>2</issue><fpage>100011</fpage><pub-id pub-id-type="doi">10.1016/j.aichem.2023.100011</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Denck</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ozkirimli</surname><given-names>E</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>K</given-names> </name></person-group><article-title>Machine-learning-based adverse drug event prediction from observational health data: a review</article-title><source>Drug Discov Today</source><year>2023</year><month>09</month><volume>28</volume><issue>9</issue><fpage>103715</fpage><pub-id pub-id-type="doi">10.1016/j.drudis.2023.103715</pub-id><pub-id pub-id-type="medline">37467879</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>D</given-names> </name><name name-style="western"><surname>He</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>T</given-names> </name></person-group><article-title>Predicting adverse drug event using machine learning based on electronic health records: a systematic review and meta-analysis</article-title><source>Front Pharmacol</source><year>2024</year><volume>15</volume><fpage>1497397</fpage><pub-id pub-id-type="doi">10.3389/fphar.2024.1497397</pub-id><pub-id pub-id-type="medline">39605909</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Teodoro</surname><given-names>D</given-names> </name><name name-style="western"><surname>Naderi</surname><given-names>N</given-names> </name><name name-style="western"><surname>Yazdani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Bornet</surname><given-names>A</given-names> </name></person-group><article-title>A scoping review of artificial intelligence applications in clinical trial risk assessment</article-title><source>NPJ Digit Med</source><year>2025</year><month>07</month><day>30</day><volume>8</volume><issue>1</issue><fpage>486</fpage><pub-id pub-id-type="doi">10.1038/s41746-025-01886-7</pub-id><pub-id pub-id-type="medline">40731070</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Page</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>McKenzie</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Bossuyt</surname><given-names>PM</given-names> </name><etal/></person-group><article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title><source>BMJ</source><year>2021</year><month>03</month><day>29</day><volume>372</volume><fpage>n71</fpage><pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id><pub-id pub-id-type="medline">33782057</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="web"><article-title>Attribution 4.0 international (CC BY 4.0)</article-title><source>Creative Commons</source><access-date>2026-05-14</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link></comment></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yazdani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bornet</surname><given-names>A</given-names> </name><name name-style="western"><surname>Khlebnikov</surname><given-names>P</given-names> </name><etal/></person-group><article-title>An evaluation benchmark for adverse drug event prediction from clinical trial results</article-title><source>Sci Data</source><year>2025</year><month>03</month><day>11</day><volume>12</volume><issue>1</issue><fpage>424</fpage><pub-id pub-id-type="doi">10.1038/s41597-025-04718-1</pub-id><pub-id pub-id-type="medline">40069213</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guan</surname><given-names>H</given-names> </name><name name-style="western"><surname>Devarakonda</surname><given-names>M</given-names> </name></person-group><article-title>Leveraging contextual information in extracting long distance relations from clinical notes</article-title><source>AMIA Annu Symp Proc</source><year>2019</year><volume>2019</volume><fpage>1051</fpage><lpage>1060</lpage><pub-id pub-id-type="medline">32308902</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yazdani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rouhizadeh</surname><given-names>H</given-names> </name><name name-style="western"><surname>Bornet</surname><given-names>A</given-names> </name><name name-style="western"><surname>Teodoro</surname><given-names>D</given-names> </name></person-group><article-title>Leveraging large language models for synthetic data generation to enhance adverse drug event detection in tweets</article-title><source>Stud Health Technol Inform</source><year>2025</year><month>05</month><day>15</day><volume>327</volume><fpage>778</fpage><lpage>782</lpage><pub-id pub-id-type="doi">10.3233/SHTI250465</pub-id><pub-id pub-id-type="medline">40380573</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Elbiach</surname><given-names>O</given-names> </name><name name-style="western"><surname>Grissette</surname><given-names>H</given-names> </name><name name-style="western"><surname>Nfaoui</surname><given-names>EH</given-names> </name></person-group><article-title>Leveraging transformer models for enhanced pharmacovigilance: a comparative analysis of ADR extraction from biomedical and social media texts</article-title><source>AI</source><year>2025</year><volume>6</volume><issue>2</issue><fpage>31</fpage><pub-id pub-id-type="doi">10.3390/ai6020031</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Martenot</surname><given-names>V</given-names> </name><name name-style="western"><surname>Masdeu</surname><given-names>V</given-names> </name><name name-style="western"><surname>Cupe</surname><given-names>J</given-names> </name><etal/></person-group><article-title>LiSA: an assisted literature search pipeline for detecting serious adverse drug events with deep learning</article-title><source>BMC Med Inform Decis Mak</source><year>2022</year><month>12</month><day>22</day><volume>22</volume><issue>1</issue><fpage>338</fpage><pub-id pub-id-type="doi">10.1186/s12911-022-02085-0</pub-id><pub-id pub-id-type="medline">36550485</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Karapetiantz</surname><given-names>P</given-names> </name><name name-style="western"><surname>Audeh</surname><given-names>B</given-names> </name><name name-style="western"><surname>Redjdal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Tiffet</surname><given-names>T</given-names> </name><name name-style="western"><surname>Bousquet</surname><given-names>C</given-names> </name><name name-style="western"><surname>Jaulent</surname><given-names>MC</given-names> </name></person-group><article-title>Monitoring adverse drug events in web forums: evaluation of a pipeline and use case study</article-title><source>J Med Internet Res</source><year>2024</year><month>06</month><day>18</day><volume>26</volume><fpage>e46176</fpage><pub-id pub-id-type="doi">10.2196/46176</pub-id><pub-id pub-id-type="medline">38888956</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nikfarjam</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sarker</surname><given-names>A</given-names> </name><name name-style="western"><surname>O&#x2019;Connor</surname><given-names>K</given-names> </name><name name-style="western"><surname>Ginn</surname><given-names>R</given-names> </name><name name-style="western"><surname>Gonzalez</surname><given-names>G</given-names> </name></person-group><article-title>Pharmacovigilance from social media: mining adverse drug reaction mentions using sequence labeling with word embedding cluster features</article-title><source>J Am Med Inform Assoc</source><year>2015</year><month>05</month><volume>22</volume><issue>3</issue><fpage>671</fpage><lpage>681</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocu041</pub-id><pub-id pub-id-type="medline">25755127</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Jamil</surname><given-names>S</given-names> </name><name name-style="western"><surname>Dabad</surname><given-names>A</given-names></name><name name-style="western"><surname>Reddy</surname><given-names>B</given-names> </name><name name-style="western"><surname>Saha</surname><given-names>S</given-names> </name><name name-style="western"><surname>Misra</surname><given-names>R</given-names> </name><name name-style="western"><surname>Shakur</surname><given-names>AA</given-names></name></person-group><article-title>GASCADE: grouped summarization of adverse drug event for enhanced cancer pharmacovigilance</article-title><year>2025</year><conf-name>European Conference on Information Retrieval</conf-name><conf-date>Apr 6-10, 2025</conf-date><conf-loc>Lucca, Italy</conf-loc><publisher-name>Springer</publisher-name><pub-id pub-id-type="doi">10.1007/978-3-031-88717-8_17</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Scaboro</surname><given-names>S</given-names> </name><name name-style="western"><surname>Portelli</surname><given-names>B</given-names> </name><name name-style="western"><surname>Chersoni</surname><given-names>E</given-names> </name><name name-style="western"><surname>Santus</surname><given-names>E</given-names> </name><name name-style="western"><surname>Serra</surname><given-names>G</given-names> </name></person-group><article-title>Extensive evaluation of transformer-based architectures for adverse drug events extraction</article-title><source>Knowl Based Syst</source><year>2023</year><month>09</month><volume>275</volume><fpage>110675</fpage><pub-id pub-id-type="doi">10.1016/j.knosys.2023.110675</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>K</given-names> </name><name name-style="western"><surname>He</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wei</surname><given-names>J</given-names> </name><etal/></person-group><article-title>BFGTP: a BERT-guided two-stage molecular representation learning framework for toxicity prediction</article-title><source>IEEE J Biomed Health Inform</source><year>2025</year><month>10</month><volume>29</volume><issue>10</issue><fpage>6960</fpage><lpage>6970</lpage><pub-id pub-id-type="doi">10.1109/JBHI.2025.3556766</pub-id><pub-id pub-id-type="medline">40168218</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ha</surname><given-names>S</given-names> </name><name name-style="western"><surname>Bang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>S</given-names> </name></person-group><article-title>Fate-tox: fragment attention transformer for E(3)-equivariant multi-organ toxicity prediction</article-title><source>J Cheminform</source><year>2025</year><month>05</month><day>14</day><volume>17</volume><issue>1</issue><fpage>74</fpage><pub-id pub-id-type="doi">10.1186/s13321-025-01012-5</pub-id><pub-id pub-id-type="medline">40369624</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>He</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Lv</surname><given-names>X</given-names> </name><name name-style="western"><surname>Long</surname><given-names>W</given-names> </name><name name-style="western"><surname>Zhai</surname><given-names>S</given-names> </name><name name-style="western"><surname>Li</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wen</surname><given-names>Z</given-names> </name></person-group><article-title>ToxBERT: an explainable AI framework for enhancing prediction of adverse drug reactions and structural insights</article-title><source>J Pharm Anal</source><year>2025</year><month>08</month><volume>15</volume><issue>8</issue><fpage>101387</fpage><pub-id pub-id-type="doi">10.1016/j.jpha.2025.101387</pub-id><pub-id pub-id-type="medline">40979546</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Xie</surname><given-names>P</given-names> </name><name name-style="western"><surname>Meng</surname><given-names>D</given-names> </name><etal/></person-group><article-title>ToxiPep: peptide toxicity prediction via fusion of context-aware representation and atomic-level graph</article-title><source>Comput Struct Biotechnol J</source><year>2025</year><volume>27</volume><fpage>2347</fpage><lpage>2358</lpage><pub-id pub-id-type="doi">10.1016/j.csbj.2025.05.039</pub-id><pub-id pub-id-type="medline">40529180</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ding</surname><given-names>X</given-names> </name><name name-style="western"><surname>Mower</surname><given-names>J</given-names> </name><name name-style="western"><surname>Subramanian</surname><given-names>D</given-names> </name><name name-style="western"><surname>Cohen</surname><given-names>T</given-names> </name></person-group><article-title>Augmenting aer2vec: enriching distributed representations of adverse event report data with orthographic and lexical information</article-title><source>J Biomed Inform</source><year>2021</year><month>07</month><volume>119</volume><fpage>103833</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2021.103833</pub-id><pub-id pub-id-type="medline">34111555</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ahmad</surname><given-names>F</given-names> </name><name name-style="western"><surname>Abbasi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kitchens</surname><given-names>B</given-names> </name><name name-style="western"><surname>Adjeroh</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Zeng</surname><given-names>D</given-names> </name></person-group><article-title>Deep learning for adverse event detection from web search</article-title><source>IEEE Trans Knowl Data Eng</source><year>2020</year><volume>34</volume><fpage>1</fpage><lpage>1</lpage><pub-id pub-id-type="doi">10.1109/TKDE.2020.3017786</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mower</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bernstam</surname><given-names>E</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>H</given-names> </name><name name-style="western"><surname>Myneni</surname><given-names>S</given-names> </name><name name-style="western"><surname>Subramanian</surname><given-names>D</given-names> </name><name name-style="western"><surname>Cohen</surname><given-names>T</given-names> </name></person-group><article-title>Improving pharmacovigilance signal detection from clinical notes with locality sensitive neural concept embeddings</article-title><source>AMIA Jt Summits Transl Sci Proc</source><year>2022</year><volume>2022</volume><fpage>349</fpage><lpage>358</lpage><pub-id pub-id-type="medline">35854716</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lavertu</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hamamsy</surname><given-names>T</given-names> </name><name name-style="western"><surname>Altman</surname><given-names>RB</given-names> </name></person-group><article-title>Quantifying the severity of adverse drug reactions using social media: network analysis</article-title><source>J Med Internet Res</source><year>2021</year><month>10</month><day>21</day><volume>23</volume><issue>10</issue><fpage>e27714</fpage><pub-id pub-id-type="doi">10.2196/27714</pub-id><pub-id pub-id-type="medline">34673524</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="web"><article-title>The drug development process</article-title><source>US Food and Drug Administration</source><year>2018</year><access-date>2026-05-12</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.fda.gov/patients/learn-about-drug-and-device-approvals/drug-development-process">https://www.fda.gov/patients/learn-about-drug-and-device-approvals/drug-development-process</ext-link></comment></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jung</surname><given-names>W</given-names> </name><name name-style="western"><surname>Goo</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hwang</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Absorption distribution metabolism excretion and toxicity property prediction utilizing a pre-trained natural language processing model and its applications in early-stage drug development</article-title><source>Pharmaceuticals (Basel)</source><year>2024</year><month>03</month><day>17</day><volume>17</volume><issue>3</issue><fpage>382</fpage><pub-id pub-id-type="doi">10.3390/ph17030382</pub-id><pub-id pub-id-type="medline">38543168</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shao</surname><given-names>C</given-names> </name><name name-style="western"><surname>Shao</surname><given-names>F</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>R</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>T</given-names> </name></person-group><article-title>An evolved transformer model for ADME/Tox prediction</article-title><source>Electronics (Basel)</source><year>2024</year><volume>13</volume><issue>3</issue><fpage>624</fpage><pub-id pub-id-type="doi">10.3390/electronics13030624</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ren</surname><given-names>J</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>Y</given-names> </name></person-group><article-title>An innovative peptide toxicity prediction model based on multi-scale convolutional neural network and residual connection</article-title><source>Bioinformatics</source><year>2025</year><month>10</month><day>2</day><volume>41</volume><issue>10</issue><fpage>btaf462</fpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btaf462</pub-id><pub-id pub-id-type="medline">40845156</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>YQ</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Song</surname><given-names>ZQ</given-names> </name><etal/></person-group><article-title>Application of large language models in drug-induced osteotoxicity prediction</article-title><source>J Chem Inf Model</source><year>2025</year><month>04</month><day>14</day><volume>65</volume><issue>7</issue><fpage>3370</fpage><lpage>3379</lpage><pub-id pub-id-type="doi">10.1021/acs.jcim.5c00275</pub-id><pub-id pub-id-type="medline">40114317</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cai</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Comprehensive drug-likeness prediction using a pretrained transformer model and multitask learning</article-title><source>J Chem Inf Model</source><year>2025</year><month>06</month><day>9</day><volume>65</volume><issue>11</issue><fpage>5370</fpage><lpage>5383</lpage><pub-id pub-id-type="doi">10.1021/acs.jcim.5c00455</pub-id><pub-id pub-id-type="medline">40393046</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aksamit</surname><given-names>N</given-names> </name><name name-style="western"><surname>Hou</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ombuki-Berman</surname><given-names>B</given-names> </name></person-group><article-title>Integrating transformers and many-objective optimization for drug design</article-title><source>BMC Bioinformatics</source><year>2024</year><month>06</month><day>8</day><volume>25</volume><issue>1</issue><fpage>208</fpage><pub-id pub-id-type="doi">10.1186/s12859-024-05822-6</pub-id><pub-id pub-id-type="medline">38849719</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jiao</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ye</surname><given-names>X</given-names> </name><name name-style="western"><surname>Sakurai</surname><given-names>T</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Han</surname><given-names>W</given-names> </name><name name-style="western"><surname>Zhan</surname><given-names>C</given-names> </name></person-group><article-title>Integration of pre-trained protein language models with equivariant graph neural networks for peptide toxicity prediction</article-title><source>BMC Biol</source><year>2025</year><month>07</month><day>28</day><volume>23</volume><issue>1</issue><fpage>229</fpage><pub-id pub-id-type="doi">10.1186/s12915-025-02329-1</pub-id><pub-id pub-id-type="medline">40721793</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Xiu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yan</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Large language models as tools for molecular toxicity prediction: AI insights into cardiotoxicity</article-title><source>J Chem Inf Model</source><year>2025</year><month>03</month><day>10</day><volume>65</volume><issue>5</issue><fpage>2268</fpage><lpage>2282</lpage><pub-id pub-id-type="doi">10.1021/acs.jcim.4c01371</pub-id><pub-id pub-id-type="medline">39982968</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dasgupta</surname><given-names>S</given-names> </name><name name-style="western"><surname>Jayagopal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Jun Hong</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Mariappan</surname><given-names>R</given-names> </name><name name-style="western"><surname>Rajan</surname><given-names>V</given-names> </name></person-group><article-title>Adverse drug event prediction using noisy literature-derived knowledge graphs: algorithm development and validation</article-title><source>JMIR Med Inform</source><year>2021</year><month>10</month><day>25</day><volume>9</volume><issue>10</issue><fpage>e32730</fpage><pub-id pub-id-type="doi">10.2196/32730</pub-id><pub-id pub-id-type="medline">34694230</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>CL</given-names> </name><name name-style="western"><surname>Tai</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Kao Yang</surname><given-names>YH</given-names> </name><name name-style="western"><surname>Chiang</surname><given-names>JH</given-names> </name></person-group><article-title>Detecting potential adverse drug reactions using a deep neural network model</article-title><source>J Med Internet Res</source><year>2019</year><month>02</month><day>6</day><volume>21</volume><issue>2</issue><fpage>e11016</fpage><pub-id pub-id-type="doi">10.2196/11016</pub-id><pub-id pub-id-type="medline">30724742</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mazuz</surname><given-names>E</given-names> </name><name name-style="western"><surname>Shtar</surname><given-names>G</given-names> </name><name name-style="western"><surname>Kutsky</surname><given-names>N</given-names> </name><name name-style="western"><surname>Rokach</surname><given-names>L</given-names> </name><name name-style="western"><surname>Shapira</surname><given-names>B</given-names> </name></person-group><article-title>Pretrained transformer models for predicting the withdrawal of drugs from the market</article-title><source>Bioinformatics</source><year>2023</year><month>08</month><day>1</day><volume>39</volume><issue>8</issue><fpage>btad519</fpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btad519</pub-id><pub-id pub-id-type="medline">37610328</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ma</surname><given-names>H</given-names> </name><name name-style="western"><surname>An</surname><given-names>W</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>H</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>R</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>J</given-names> </name></person-group><article-title>Deep graph learning with property augmentation for predicting drug-induced liver injury</article-title><source>Chem Res Toxicol</source><year>2021</year><month>02</month><day>15</day><volume>34</volume><issue>2</issue><fpage>495</fpage><lpage>506</lpage><pub-id pub-id-type="doi">10.1021/acs.chemrestox.0c00322</pub-id><pub-id pub-id-type="medline">33347312</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kurosaki</surname><given-names>K</given-names> </name><name name-style="western"><surname>Uesawa</surname><given-names>Y</given-names> </name></person-group><article-title>Development of in silico prediction models for drug-induced liver malignant tumors based on the activity of molecular initiating events: biologically interpretable features</article-title><source>J Toxicol Sci</source><year>2022</year><volume>47</volume><issue>3</issue><fpage>89</fpage><lpage>98</lpage><pub-id pub-id-type="doi">10.2131/jts.47.89</pub-id><pub-id pub-id-type="medline">35236804</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Feng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>H</given-names> </name><name name-style="western"><surname>Yuan</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Gene expression data based deep learning model for accurate prediction of drug-induced liver injury in advance</article-title><source>J Chem Inf Model</source><year>2019</year><month>07</month><day>22</day><volume>59</volume><issue>7</issue><fpage>3240</fpage><lpage>3250</lpage><pub-id pub-id-type="doi">10.1021/acs.jcim.9b00143</pub-id><pub-id pub-id-type="medline">31188585</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nguyen-Vo</surname><given-names>TH</given-names> </name><name name-style="western"><surname>Nguyen</surname><given-names>L</given-names> </name><name name-style="western"><surname>Do</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Predicting drug-induced liver injury using convolutional neural network and molecular fingerprint-embedded features</article-title><source>ACS Omega</source><year>2020</year><month>10</month><day>6</day><volume>5</volume><issue>39</issue><fpage>25432</fpage><lpage>25439</lpage><pub-id pub-id-type="doi">10.1021/acsomega.0c03866</pub-id><pub-id pub-id-type="medline">33043223</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Shi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yi</surname><given-names>J</given-names> </name><etal/></person-group><article-title>ADMETlab 3.0: an updated comprehensive online ADMET prediction platform enhanced with broader coverage, improved performance, API functionality and decision support</article-title><source>Nucleic Acids Res</source><year>2024</year><month>07</month><day>5</day><volume>52</volume><issue>W1</issue><fpage>W422</fpage><lpage>W431</lpage><pub-id pub-id-type="doi">10.1093/nar/gkae236</pub-id><pub-id pub-id-type="medline">38572755</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Barratt</surname><given-names>MD</given-names> </name></person-group><article-title>Prediction of toxicity from chemical structure</article-title><source>Cell Biol Toxicol</source><year>2000</year><volume>16</volume><issue>1</issue><fpage>1</fpage><lpage>13</lpage><pub-id pub-id-type="doi">10.1023/a:1007676602908</pub-id><pub-id pub-id-type="medline">10890502</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wunnava</surname><given-names>S</given-names> </name><name name-style="western"><surname>Qin</surname><given-names>X</given-names> </name><name name-style="western"><surname>Kakar</surname><given-names>T</given-names> </name><name name-style="western"><surname>Sen</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rundensteiner</surname><given-names>EA</given-names> </name><name name-style="western"><surname>Kong</surname><given-names>X</given-names> </name></person-group><article-title>Adverse drug event detection from electronic health records using hierarchical recurrent neural networks with dual-level embedding</article-title><source>Drug Saf</source><year>2019</year><month>01</month><volume>42</volume><issue>1</issue><fpage>113</fpage><lpage>122</lpage><pub-id pub-id-type="doi">10.1007/s40264-018-0765-9</pub-id><pub-id pub-id-type="medline">30649736</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sboev</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rybka</surname><given-names>R</given-names> </name><name name-style="western"><surname>Gryaznov</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Adverse drug reaction concept normalization in Russian-language reviews of internet users</article-title><source>Big Data Cogn Comput</source><year>2022</year><volume>6</volume><issue>4</issue><fpage>145</fpage><pub-id pub-id-type="doi">10.3390/bdcc6040145</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>W</given-names> </name></person-group><article-title>An effective emotional expression and knowledge-enhanced method for detecting adverse drug reactions</article-title><source>IEEE Access</source><year>2020</year><volume>8</volume><fpage>87083</fpage><lpage>87093</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2020.2993169</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roosan</surname><given-names>D</given-names> </name><name name-style="western"><surname>Law</surname><given-names>AV</given-names> </name><name name-style="western"><surname>Roosan</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name></person-group><article-title>Artificial intelligent context-aware machine-learning tool to detect adverse drug events from social media platforms</article-title><source>J Med Toxicol</source><year>2022</year><month>10</month><volume>18</volume><issue>4</issue><fpage>311</fpage><lpage>320</lpage><pub-id pub-id-type="doi">10.1007/s13181-022-00906-2</pub-id><pub-id pub-id-type="medline">36097239</pub-id></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kang</surname><given-names>T</given-names> </name><name name-style="western"><surname>Chung</surname><given-names>TK</given-names> </name><etal/></person-group><article-title>Automatic extraction of comprehensive drug safety information from adverse drug event narratives in the Korea adverse event reporting system using natural language processing techniques</article-title><source>Drug Saf</source><year>2023</year><month>08</month><volume>46</volume><issue>8</issue><fpage>781</fpage><lpage>795</lpage><pub-id pub-id-type="doi">10.1007/s40264-023-01323-2</pub-id><pub-id pub-id-type="medline">37330415</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Elbiach</surname><given-names>O</given-names> </name><name name-style="western"><surname>Grissette</surname><given-names>H</given-names> </name><name name-style="western"><surname>Nfaoui</surname><given-names>EH</given-names> </name></person-group><article-title>Benchmarking large language models for adverse drug reaction extraction in social media and clinical texts</article-title><source>Results Eng</source><year>2025</year><month>12</month><volume>28</volume><fpage>107362</fpage><pub-id pub-id-type="doi">10.1016/j.rineng.2025.107362</pub-id></nlm-citation></ref><ref id="ref64"><label>64</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>H</given-names> </name><name name-style="western"><surname>Ji</surname><given-names>J</given-names> </name><name name-style="western"><surname>Tian</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Chinese-named entity recognition from adverse drug event records: radical embedding-combined dynamic embedding-based BERT in a bidirectional long short-term conditional random field (Bi-LSTM-CRF) model</article-title><source>JMIR Med Inform</source><year>2021</year><month>12</month><day>1</day><volume>9</volume><issue>12</issue><fpage>e26407</fpage><pub-id pub-id-type="doi">10.2196/26407</pub-id><pub-id pub-id-type="medline">34855616</pub-id></nlm-citation></ref><ref id="ref65"><label>65</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cocos</surname><given-names>A</given-names> </name><name name-style="western"><surname>Fiks</surname><given-names>AG</given-names> </name><name name-style="western"><surname>Masino</surname><given-names>AJ</given-names> </name></person-group><article-title>Deep learning for pharmacovigilance: recurrent neural network architectures for labeling adverse drug reactions in Twitter posts</article-title><source>J Am Med Inform Assoc</source><year>2017</year><month>07</month><day>1</day><volume>24</volume><issue>4</issue><fpage>813</fpage><lpage>821</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocw180</pub-id><pub-id pub-id-type="medline">28339747</pub-id></nlm-citation></ref><ref id="ref66"><label>66</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Henriksson</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kvist</surname><given-names>M</given-names> </name><name name-style="western"><surname>Dalianis</surname><given-names>H</given-names> </name><name name-style="western"><surname>Duneld</surname><given-names>M</given-names> </name></person-group><article-title>Identifying adverse drug event information in clinical notes with distributional semantic representations of context</article-title><source>J Biomed Inform</source><year>2015</year><month>10</month><volume>57</volume><fpage>333</fpage><lpage>349</lpage><pub-id pub-id-type="doi">10.1016/j.jbi.2015.08.013</pub-id></nlm-citation></ref><ref id="ref67"><label>67</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kopacheva</surname><given-names>E</given-names> </name><name name-style="western"><surname>Henriksson</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dalianis</surname><given-names>H</given-names> </name><name name-style="western"><surname>Hammar</surname><given-names>T</given-names> </name><name name-style="western"><surname>Lincke</surname><given-names>A</given-names> </name></person-group><article-title>Identifying adverse drug events in clinical text using fine-tuned clinical language models: machine learning study</article-title><source>JMIR Form Res</source><year>2025</year><month>09</month><day>11</day><volume>9</volume><fpage>e71949</fpage><pub-id pub-id-type="doi">10.2196/71949</pub-id><pub-id pub-id-type="medline">40934508</pub-id></nlm-citation></ref><ref id="ref68"><label>68</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rawat</surname><given-names>BPS</given-names> </name><name name-style="western"><surname>Jagannatha</surname><given-names>A</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>F</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>H</given-names> </name></person-group><article-title>Inferring ADR causality by predicting the Naranjo Score from clinical notes</article-title><source>AMIA Annu Symp Proc</source><year>2020</year><volume>2020</volume><fpage>1041</fpage><lpage>1049</lpage><pub-id pub-id-type="medline">33936480</pub-id></nlm-citation></ref><ref id="ref69"><label>69</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Karapetian</surname><given-names>K</given-names> </name><name name-style="western"><surname>Jeon</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Kwon</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Suh</surname><given-names>YK</given-names> </name></person-group><article-title>Supervised relation extraction between suicide-related entities and drugs: development and usability study of an annotated PubMed corpus</article-title><source>J Med Internet Res</source><year>2023</year><month>03</month><day>8</day><volume>25</volume><fpage>e41100</fpage><pub-id pub-id-type="doi">10.2196/41100</pub-id><pub-id pub-id-type="medline">36884281</pub-id></nlm-citation></ref><ref id="ref70"><label>70</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Gao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ji</surname><given-names>S</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>T</given-names> </name><name name-style="western"><surname>Tiwari</surname><given-names>P</given-names> </name><name name-style="western"><surname>Marttinen</surname><given-names>P</given-names> </name></person-group><article-title>Contextualized graph embeddings for adverse drug event detection</article-title><conf-name>Machine Learning and Knowledge Discovery in Databases: European Conference</conf-name><conf-date>Sep 19-23, 2022</conf-date><pub-id pub-id-type="doi">10.1007/978-3-031-26390-3_35</pub-id></nlm-citation></ref><ref id="ref71"><label>71</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Masino</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Forsyth</surname><given-names>D</given-names> </name><name name-style="western"><surname>Fiks</surname><given-names>AG</given-names> </name></person-group><article-title>Detectingadverse drug reactions on Twitter with convolutional neural networks and word embedding features</article-title><source>J Healthc Inform Res</source><year>2018</year><month>06</month><volume>2</volume><issue>1-2</issue><fpage>25</fpage><lpage>43</lpage><pub-id pub-id-type="doi">10.1007/s41666-018-0018-9</pub-id><pub-id pub-id-type="medline">35415401</pub-id></nlm-citation></ref><ref id="ref72"><label>72</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McMaster</surname><given-names>C</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Liew</surname><given-names>DFL</given-names> </name><etal/></person-group><article-title>Developing a deep learning natural language processing algorithm for automated reporting of adverse drug reactions</article-title><source>J Biomed Inform</source><year>2023</year><month>01</month><volume>137</volume><fpage>104265</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2022.104265</pub-id></nlm-citation></ref><ref id="ref73"><label>73</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Bera</surname><given-names>A</given-names> </name><name name-style="western"><surname>Das</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ghosh</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chakraborty</surname><given-names>R</given-names> </name><name name-style="western"><surname>Mitra</surname><given-names>I</given-names> </name><name name-style="western"><surname>Nandy</surname><given-names>P</given-names> </name></person-group><article-title>Harnessing transformers for detecting adverse drug reaction and customized causality explanation using generative AI</article-title><conf-name>2023 7th International Conference on Computing, Communication, Control and Automation (ICCUBEA)</conf-name><conf-date>Aug 18-19, 2023</conf-date><pub-id pub-id-type="doi">10.1109/ICCUBEA58933.2023.10392249</pub-id></nlm-citation></ref><ref id="ref74"><label>74</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>WP</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>KD</given-names> </name></person-group><article-title>Predicting adverse drug reactions from social media posts: data balance, feature selection and deep learning</article-title><source>Healthcare (Basel)</source><year>2022</year><month>03</month><day>25</day><volume>10</volume><issue>4</issue><fpage>618</fpage><pub-id pub-id-type="doi">10.3390/healthcare10040618</pub-id><pub-id pub-id-type="medline">35455795</pub-id></nlm-citation></ref><ref id="ref75"><label>75</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Martin</surname><given-names>GL</given-names> </name><name name-style="western"><surname>Jouganous</surname><given-names>J</given-names> </name><name name-style="western"><surname>Savidan</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Validation of artificial intelligence to support the automatic coding of patient adverse drug reaction reports, using nationwide pharmacovigilance data</article-title><source>Drug Saf</source><year>2022</year><month>05</month><volume>45</volume><issue>5</issue><fpage>535</fpage><lpage>548</lpage><pub-id pub-id-type="doi">10.1007/s40264-022-01153-8</pub-id><pub-id pub-id-type="medline">35579816</pub-id></nlm-citation></ref><ref id="ref76"><label>76</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wegner</surname><given-names>P</given-names> </name><name name-style="western"><surname>Fr&#x00F6;hlich</surname><given-names>H</given-names> </name><name name-style="western"><surname>Madan</surname><given-names>S</given-names> </name></person-group><article-title>Evaluating knowledge fusion models on detecting adverse drug events in text</article-title><source>PLOS Digit Health</source><year>2025</year><month>03</month><volume>4</volume><issue>3</issue><fpage>e0000468</fpage><pub-id pub-id-type="doi">10.1371/journal.pdig.0000468</pub-id><pub-id pub-id-type="medline">40100877</pub-id></nlm-citation></ref><ref id="ref77"><label>77</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rathore</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Kumar</surname><given-names>N</given-names> </name><name name-style="western"><surname>Choudhury</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mehta</surname><given-names>NK</given-names> </name><name name-style="western"><surname>Raghava</surname><given-names>GPS</given-names> </name></person-group><article-title>Prediction of hemolytic peptides and their hemolytic concentration</article-title><source>Commun Biol</source><year>2025</year><month>02</month><day>4</day><volume>8</volume><issue>1</issue><fpage>176</fpage><pub-id pub-id-type="doi">10.1038/s42003-025-07615-w</pub-id><pub-id pub-id-type="medline">39905233</pub-id></nlm-citation></ref><ref id="ref78"><label>78</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Harrison</surname><given-names>J</given-names> </name><name name-style="western"><surname>Mozzicato</surname><given-names>P</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Aronson</surname><given-names>JK</given-names> </name><name name-style="western"><surname>Aronson</surname><given-names>JK</given-names> </name></person-group><article-title>MedDRA&#x00AE;: the tale of a terminology</article-title><source>Side Effects of Drugs Annual</source><year>2009</year><volume>31</volume><publisher-name>Elsevier</publisher-name><pub-id pub-id-type="doi">10.1016/S0378-6080(09)03160-2</pub-id></nlm-citation></ref><ref id="ref79"><label>79</label><nlm-citation citation-type="web"><article-title>Guidelines for ATC classification and DDD assignment</article-title><source>World Health Organization Collaborating Centre for Drug Statistics Methodology</source><year>2000</year><access-date>2026-06-10</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://atcddd.fhi.no/atc_ddd_index_and_guidelines/guidelines/">https://atcddd.fhi.no/atc_ddd_index_and_guidelines/guidelines/</ext-link></comment></nlm-citation></ref><ref id="ref80"><label>80</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhao</surname><given-names>H</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name></person-group><article-title>A convolutional neural network and graph convolutional network-based method for predicting the classification of anatomical therapeutic chemicals</article-title><source>Bioinformatics</source><year>2021</year><month>09</month><day>29</day><volume>37</volume><issue>18</issue><fpage>2841</fpage><lpage>2847</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btab204</pub-id><pub-id pub-id-type="medline">33769479</pub-id></nlm-citation></ref><ref id="ref81"><label>81</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>L</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>Y</given-names> </name></person-group><article-title>PDATC-NCPMKL: predicting drug&#x2019;s anatomical therapeutic chemical (ATC) codes based on network consistency projection and multiple kernel learning</article-title><source>Comput Biol Med</source><year>2024</year><month>02</month><volume>169</volume><fpage>107862</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.107862</pub-id><pub-id pub-id-type="medline">38150886</pub-id></nlm-citation></ref><ref id="ref82"><label>82</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grafton</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ho</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ranjbarvaziri</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Deep learning detects cardiotoxicity in a high-content screen with induced pluripotent stem cell-derived cardiomyocytes</article-title><source>Elife</source><year>2021</year><month>08</month><day>2</day><volume>10</volume><fpage>e68714</fpage><pub-id pub-id-type="doi">10.7554/eLife.68714</pub-id><pub-id pub-id-type="medline">34338636</pub-id></nlm-citation></ref><ref id="ref83"><label>83</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>R</given-names> </name><name name-style="western"><surname>Schyman</surname><given-names>P</given-names> </name><name name-style="western"><surname>Wallqvist</surname><given-names>A</given-names> </name></person-group><article-title>Deep neural network models for predicting chemically induced liver toxicity endpoints from transcriptomic responses</article-title><source>Front Pharmacol</source><year>2019</year><volume>10</volume><fpage>30804783</fpage><pub-id pub-id-type="doi">10.3389/fphar.2019.00042</pub-id></nlm-citation></ref><ref id="ref84"><label>84</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Su</surname><given-names>R</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wei</surname><given-names>L</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>Q</given-names> </name></person-group><article-title>A multi-label learning model for predicting drug-induced pathology in multi-organ based on toxicogenomics data</article-title><source>PLOS Comput Biol</source><year>2022</year><month>09</month><volume>18</volume><issue>9</issue><fpage>e1010402</fpage><pub-id pub-id-type="doi">10.1371/journal.pcbi.1010402</pub-id><pub-id pub-id-type="medline">36070305</pub-id></nlm-citation></ref><ref id="ref85"><label>85</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chang</surname><given-names>WT</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>CF</given-names> </name><name name-style="western"><surname>Feng</surname><given-names>YH</given-names> </name><etal/></person-group><article-title>An artificial intelligence approach for predicting cardiotoxicity in breast cancer patients receiving anthracycline</article-title><source>Arch Toxicol</source><year>2022</year><month>10</month><volume>96</volume><issue>10</issue><fpage>2731</fpage><lpage>2737</lpage><pub-id pub-id-type="doi">10.1007/s00204-022-03341-y</pub-id><pub-id pub-id-type="medline">35876889</pub-id></nlm-citation></ref><ref id="ref86"><label>86</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Long</surname><given-names>TZ</given-names> </name><name name-style="western"><surname>Shi</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Structural analysis and prediction of hematotoxicity using deep learning approaches</article-title><source>J Chem Inf Model</source><year>2023</year><month>01</month><day>9</day><volume>63</volume><issue>1</issue><fpage>111</fpage><lpage>125</lpage><pub-id pub-id-type="doi">10.1021/acs.jcim.2c01088</pub-id><pub-id pub-id-type="medline">36472475</pub-id></nlm-citation></ref><ref id="ref87"><label>87</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gorelick</surname><given-names>FS</given-names> </name><name name-style="western"><surname>Lerch</surname><given-names>MM</given-names> </name></person-group><article-title>Do animal models of acute pancreatitis reproduce human disease?</article-title><source>Cell Mol Gastroenterol Hepatol</source><year>2017</year><month>09</month><volume>4</volume><issue>2</issue><fpage>251</fpage><lpage>262</lpage><pub-id pub-id-type="doi">10.1016/j.jcmgh.2017.05.007</pub-id><pub-id pub-id-type="medline">28752114</pub-id></nlm-citation></ref><ref id="ref88"><label>88</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>H</given-names> </name></person-group><article-title>Modeling neurological diseases with human brain organoids</article-title><source>Front Synaptic Neurosci</source><year>2018</year><volume>10</volume><fpage>15</fpage><pub-id pub-id-type="doi">10.3389/fnsyn.2018.00015</pub-id><pub-id pub-id-type="medline">29937727</pub-id></nlm-citation></ref><ref id="ref89"><label>89</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chekroud</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Hawrilenko</surname><given-names>M</given-names> </name><name name-style="western"><surname>Loho</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Illusory generalizability of clinical prediction models</article-title><source>Science</source><year>2024</year><month>01</month><day>12</day><volume>383</volume><issue>6679</issue><fpage>164</fpage><lpage>167</lpage><pub-id pub-id-type="doi">10.1126/science.adg8538</pub-id><pub-id pub-id-type="medline">38207039</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Checklist 1</label><p>PRISMA-ScR checklist.</p><media xlink:href="ai_v5i1e77732_app1.docx" xlink:title="DOCX File, 30 KB"/></supplementary-material></app-group></back></article>