<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR AI</journal-id>
      <journal-title>JMIR AI</journal-title>
      <issn pub-type="epub">2817-1705</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v3i1e50800</article-id>
      <article-id pub-id-type="pmid">39073872</article-id>
      <article-id pub-id-type="doi">10.2196/50800</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Optimizing Clinical Trial Eligibility Design Using Natural Language Processing Models and Real-World Data: Algorithm Development and Validation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>El Emam</surname>
            <given-names>Khaled</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Malin</surname>
            <given-names>Bradley</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Khursheed</surname>
            <given-names>Mohammad Omar</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chrimes</surname>
            <given-names>Dillon</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Han</surname>
            <given-names>Peijin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Guo</surname>
            <given-names>Lei</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Kyeryoung</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6937-9931</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Zongzhi</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1578-9967</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Mai</surname>
            <given-names>Yun</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6011-8874</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Jun</surname>
            <given-names>Tomi</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2120-1704</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Ma</surname>
            <given-names>Meng</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0212-298X</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Tongyu</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0008-6618-3088</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Ai</surname>
            <given-names>Lei</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2802-5774</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Calay</surname>
            <given-names>Ediz</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6225-7598</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Oh</surname>
            <given-names>William</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5113-8147</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Stolovitzky</surname>
            <given-names>Gustavo</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9618-2819</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Schadt</surname>
            <given-names>Eric</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7892-8808</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Xiaoyan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>GendDx (Sema4)</institution>
            <addr-line>333 Ludlow Street</addr-line>
            <addr-line>Stamford, CT, 06902</addr-line>
            <country>United States</country>
            <phone>1 (844) 241 1233</phone>
            <email>xw108@caa.columbia.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4193-4120</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>GendDx (Sema4)</institution>
        <addr-line>Stamford, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Icahn School of Medicine at Mount Sinai</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Xiaoyan Wang <email>xw108@caa.columbia.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>29</day>
        <month>7</month>
        <year>2024</year>
      </pub-date>
      <volume>3</volume>
      <elocation-id>e50800</elocation-id>
      <history>
        <date date-type="received">
          <day>16</day>
          <month>7</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>18</day>
          <month>10</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>7</day>
          <month>11</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>23</day>
          <month>3</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Kyeryoung Lee, Zongzhi Liu, Yun Mai, Tomi Jun, Meng Ma, Tongyu Wang, Lei Ai, Ediz Calay, William Oh, Gustavo Stolovitzky, Eric Schadt, Xiaoyan Wang. Originally published in JMIR AI (https://ai.jmir.org), 29.07.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on https://www.ai.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://ai.jmir.org/2024/1/e50800" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Clinical trials are vital for developing new therapies but can also delay drug development. Efficient trial data management, optimized trial protocol, and accurate patient identification are critical for reducing trial timelines. Natural language processing (NLP) has the potential to achieve these objectives.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to assess the feasibility of using data-driven approaches to optimize clinical trial protocol design and identify eligible patients. This involves creating a comprehensive eligibility criteria knowledge base integrated within electronic health records using deep learning–based NLP techniques.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We obtained data of 3281 industry-sponsored phase 2 or 3 interventional clinical trials recruiting patients with non–small cell lung cancer, prostate cancer, breast cancer, multiple myeloma, ulcerative colitis, and Crohn disease from ClinicalTrials.gov, spanning the period between 2013 and 2020. A customized bidirectional long short-term memory– and conditional random field–based NLP pipeline was used to extract all eligibility criteria attributes and convert hypernym concepts into computable hyponyms along with their corresponding values. To illustrate the simulation of clinical trial design for optimization purposes, we selected a subset of patients with non–small cell lung cancer (n=2775), curated from the Mount Sinai Health System, as a pilot study.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We manually annotated the clinical trial eligibility corpus (485/3281, 14.78% trials) and constructed an eligibility criteria–specific ontology. Our customized NLP pipeline, developed based on the eligibility criteria–specific ontology that we created through manual annotation, achieved high precision (0.91, range 0.67-1.00) and recall (0.79, range 0.50-1) scores, as well as a high <italic>F</italic><sub>1</sub>-score (0.83, range 0.67-1), enabling the efficient extraction of granular criteria entities and relevant attributes from 3281 clinical trials. A standardized eligibility criteria knowledge base, compatible with electronic health records, was developed by transforming hypernym concepts into machine-interpretable hyponyms along with their corresponding values. In addition, an interface prototype demonstrated the practicality of leveraging real-world data for optimizing clinical trial protocols and identifying eligible patients.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our customized NLP pipeline successfully generated a standardized eligibility criteria knowledge base by transforming hypernym criteria into machine-readable hyponyms along with their corresponding values. A prototype interface integrating real-world patient information allows us to assess the impact of each eligibility criterion on the number of patients eligible for the trial. Leveraging NLP and real-world data in a data-driven approach holds promise for streamlining the overall clinical trial process, optimizing processes, and improving efficiency in patient identification.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>natural language processing</kwd>
        <kwd>real-world data</kwd>
        <kwd>clinical trial eligibility criteria</kwd>
        <kwd>eligibility criteria–specific ontology</kwd>
        <kwd>clinical trial protocol optimization</kwd>
        <kwd>data-driven approach</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Clinical trials are crucial for developing new therapies, but they require significant resources and can introduce delays in drug development, leading to increased costs [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Complex and restrictive eligibility criteria hinder patient enrollment, impacting target goals, timelines, and ultimately patient well-being [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref5">5</xref>]. This issue is particularly notable in cancer trials with poor recruitment and high failure rates [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>] because &gt;80% of the trials fail to meet their initial target accruals and timelines [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. In addition, overly restrictive eligibility criteria limit the representation of the broader patient population, reducing real-world applicability and treatment impact [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. Nonetheless, the practice of trials reusing complicated eligibility criteria without a clear rationale is a common one [<xref ref-type="bibr" rid="ref14">14</xref>], despite the minimal impact on trial outcomes [<xref ref-type="bibr" rid="ref15">15</xref>]. Liu et al [<xref ref-type="bibr" rid="ref15">15</xref>] demonstrated that broadening eligibility criteria using a data-driven approach can benefit initially excluded patients. A comprehensive and standardized eligibility criteria knowledge base that is compatible with real-world data can address these challenges. Such a knowledge base optimizes trial protocol design, improves patient enrollment, enhances the reliability and applicability of evidence synthesis, and fosters the efficient development of new therapies. Furthermore, it enables opportunities such as generating synthetic control arms (SCAs) for single-arm clinical trials using electronic health records (EHRs) [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>].</p>
        <p>The importance of semantically representing eligibility criteria interoperable with EHRs has been highlighted in multiple studies [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. Converting free-text eligibility criteria to computable formats poses challenges, addressed by a range of natural language processing (NLP) techniques and transformer models [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. An NLP interface, Criteria2Query, enables computable queries for eligible cohort identification using EHRs [<xref ref-type="bibr" rid="ref27">27</xref>]. This tool supports clinical trial knowledge base development, enhancing EHR interoperability and scalability for efficient eligibility criteria knowledge engineering [<xref ref-type="bibr" rid="ref28">28</xref>]. Manually annotated data sets such as “Chia, a large annotated corpus of clinical trial eligibility criteria” [<xref ref-type="bibr" rid="ref29">29</xref>] and the “Leaf Clinical Trials corpus, the largest and most comprehensive human-annotated corpus of publicly available clinical trials eligibility criteria” [<xref ref-type="bibr" rid="ref30">30</xref>] have significantly enhanced NLP model training and the development of effective query structures. Despite significant progress in bridging the gap between eligibility criteria and EHRs, limitations persist in accurately representing the granularities of eligibility criteria and real-time eligible patient number checks [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. Using varying hierarchical levels of medical concepts, whether as hypernyms or hyponyms, presents one of the challenges when aligning eligibility criteria with EHRs; for instance, numerous trial eligibility criteria use hypernyms, which encompass a group of related medical concepts, such as <italic>cardiovascular disease</italic>. Conversely, the patient problem list within the EHR specifies particular medical conditions or diseases (hyponyms), such as <italic>myocardial infarction</italic>. Establishing a standardized eligibility criteria knowledge base by transforming ambiguous hypernym concepts into computable hyponyms can enhance optimizing trial protocol design and identifying eligible patients through seamless integration with EHR data.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>In this study, we aim to create a standardized eligibility criteria knowledge base that seamlessly integrates with EHRs. By using deep learning–based NLP techniques, hypernym concepts in eligibility criteria will be converted to their EHR-compatible hyponyms along with their corresponding values. In addition, the prototype user interface will be developed as a pilot study, enabling the data-driven optimization of clinical trial protocols and the identification of eligible patients through the integration of the eligibility criteria knowledge base and EHRs.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Set</title>
        <p>We obtained the data from ClinicalTrials.gov, specifically industry-sponsored phase 2 or 3 interventional clinical trials initiated between January 2013 and May 2020. A total of 3281 trials were identified: 817 (24.9%) for non–small cell lung cancer (NSCLC), 649 (19.78%) for prostate cancer (PCa), 1057 (32.22%) for breast cancer (BCa), 447 (13.62%) for multiple myeloma (MM), 160 (4.88%) for ulcerative colitis (UC), and 151 (4.6%) for Crohn disease (CD).</p>
        <p>For the development of the prototype interface, we selected a subgroup of patients (n=2775) diagnosed with NSCLC from a previously curated cohort of patients with lung cancer. This cohort was established using the data from Mount Sinai-Sema4 Health System data [<xref ref-type="bibr" rid="ref33">33</xref>], and patient information was deidentified for the purposes of this study.</p>
      </sec>
      <sec>
        <title>Deep Learning–Based NLP Pipeline Development</title>
        <p>Our NLP pipeline consists of 3 modules: ontology construction and manual annotation, model training and pipeline evaluation, and application.</p>
        <sec>
          <title>Ontology Construction and Manual Annotation</title>
          <p>To construct our ontology, we randomly selected 425 eligibility criteria from diverse cancer trials and manually analyzed entities and relations. This manual analysis focused on identifying entities and their relationships. Entities were subsequently categorized into primary and modifier groups, with detailed examples provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendices 1</xref> and <xref ref-type="supplementary-material" rid="app2">2</xref>. The primary groups included <italic>demographic</italic>, <italic>diagnosis</italic>, <italic>biomarker</italic>, <italic>disease status</italic>, <italic>prior therapy</italic>, <italic>comorbidity</italic>, <italic>laboratory test</italic>, <italic>vital</italic>, <italic>procedure</italic>, and <italic>other medication</italic>, while the modifier groups included <italic>value</italic>, <italic>condition</italic>, <italic>evidence</italic>, <italic>lines of therapy</italic>, <italic>negation</italic>, <italic>exception</italic>, <italic>grade</italic>, <italic>dose</italic>, and <italic>temporal</italic>. Any entities that did not fall into the primary groups were classified as <italic>other observation</italic>. Furthermore, we defined relations between the entities. The commonly detected relationships between the <italic>primary</italic> and <italic>modifier</italic> groups were (1) <italic>has_value_limit</italic> between <italic>demographic (age) or vital lorlaboratory test</italic> and <italic>value</italic>, (2) <italic>has temporal limit</italic> between <italic>comorbidity or other medication or procedure</italic> and <italic>temporal</italic>, (3) <italic>has_negation</italic> between <italic>observation or biomarker or prior therapy</italic> and <italic>negation,</italic> and (4) <italic>has_exception</italic> between <italic>comorbidities or biomarker or diagnosis</italic> and <italic>exception.</italic> Other relationships included <italic>has_dose limit</italic>, <italic>has_line of therapy limit</italic>, <italic>has_grade_limit</italic>, <italic>has_condition</italic>, and <italic>need_evidence</italic>. The applicability of the ontology was tested on 60 UC and CD trials. Next, we manually annotated 246 eligibility criteria from NSCLC trials and performed model training using Clinical Language Annotation, Modeling, and Processing, which is an NLP toolkit [<xref ref-type="bibr" rid="ref34">34</xref>].</p>
        </sec>
        <sec>
          <title>Model Training and Pipeline Evaluation</title>
          <p>A multilayer deep learning architecture was implemented for NLP modeling. The first step involved transforming the text into sequential vectors of characterization during the embedding process. These vectors were subsequently input into a bidirectional long short-term memory network, which is an artificial neural network designed for text classification. The bidirectional long short-term memory network was used to recognize patterns in both forward and backward directions [<xref ref-type="bibr" rid="ref35">35</xref>]. The identified patterns were then passed to the next layer, which used a conditional random field model to compute the prediction probability [<xref ref-type="bibr" rid="ref36">36</xref>]. The NLP model was trained using annotated criteria, with 80% of the manually annotated gold standard data allocated for training. Model performance was evaluated on a separate validation set (20%) using precision, recall, and <italic>F</italic><sub>1</sub>-score values:</p>
          <p>
            <disp-formula>Precision = TP / (TP + FP) <bold>(1)</bold></disp-formula>
          </p>
          <p>
            <disp-formula>Recall = TP / (TP + FN) <bold>(2)</bold></disp-formula>
          </p>
          <p>
            <disp-formula><italic>F</italic><sub>1</sub>-score = 2 × (Precision × Recall) / (Precision + Recall) <bold>(3)</bold></disp-formula>
          </p>
          <p>In equations 1 and 2, TP stands for true positives, FP for false positives, and FN for false negatives.</p>
          <p>The manual annotation and training processes were iteratively performed with additional manually annotated notes until the model achieved a <italic>F<sub>1</sub></italic>-score of &gt;0.8 in the test set (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). To tailor the pipeline for specific cancer types, a preannotation method using the NSCLC pipeline was implemented for PCa, BCa, and MM for common eligibility criteria such as laboratory test values and comorbidities. Specific eligibility criteria such as biomarkers and treatments were manually annotated for each cancer type: PCa with 124 trials, BCa with 73 trials, and MM with 60 trials.</p>
        </sec>
        <sec>
          <title>Application</title>
          <p>The fully trained named entity recognition and relation models were integrated and applied to annotate the remaining eligibility criteria for the 4 types of cancer studied (BCa, MM, NSCLC, and PCa). The output data included sentences, tokens, parts of speech, entities, negations, and relations.</p>
        </sec>
      </sec>
      <sec>
        <title>Construction of Standardized Eligibility Criteria Knowledge Base Table</title>
        <p>The standardized knowledge base was constructed in an <italic>EntityGroup-AttributeName-Value</italic> format, involving 2 key steps: attribute normalization and transforming hypernyms to hyponyms with corresponding values.</p>
        <sec>
          <title>Attribute Normalization</title>
          <p>To normalize attributes, we used a 3-step approach. First, we assigned a Unified Medical Language System concept unique identifier to map synonyms of an entity, such as <italic>estrogen receptor-positive</italic>, <italic>ER-positive</italic>, and <italic>ER+</italic> to the Unified Medical Language System concept unique identifier <italic>C0279754</italic>. Second, we developed a set of rules (<xref ref-type="table" rid="table1">Table 1</xref>) to map abbreviations (eg, <italic>CrCl</italic> to <italic>creatinine clearance</italic>) and different phrases with the same meaning (eg, ≥<italic>1.5x ULN</italic> [where <italic>ULN</italic> stands for <italic>upper limit of normal</italic>], <italic>greater than or equal to 1.5x ULN</italic>, and ≥<italic>1.5x upper limit of normal</italic>) back to their original text. Finally, 2 domain experts manually curated unnormalized entities.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Rules for attribute normalization.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="670"/>
              <col width="0"/>
              <col width="300"/>
              <thead>
                <tr valign="top">
                  <td colspan="3">Rule and attributes from eligibility criteria</td>
                  <td>Normalized attributes</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="4">
                    <bold>Rules for mapping synonyms</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>AST<sup>a</sup>, SGOT<sup>b</sup>, aspartate aminotransferase, serum AST</td>
                  <td colspan="2">AST</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ALT<sup>c</sup>, SGPT<sup>d</sup>, alanine aminotransferase, serum ALT</td>
                  <td colspan="2">ALT</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Total bilirubin, serum bilirubin, total bilirubin level, bilirubin level</td>
                  <td colspan="2">Total bilirubin</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Hgb<sup>e</sup>, hemoglobin</td>
                  <td colspan="2">Hgb</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>HbA<sub>1c</sub><sup>f</sup>, hemoglobinA<sub>1c</sub></td>
                  <td colspan="2">HbA<sub>1c</sub></td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>serum creatinine, creatinine, creatinine levels, creatinine level</td>
                  <td colspan="2">Serum creatinine</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ANC<sup>g</sup>, absolute neutrophil count, absolute neutrophil counts, neutrophil count, neutrophil counts, absolute neutrophil</td>
                  <td colspan="2">ANC</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>WBC<sup>h</sup>, white blood cells, white blood cell, WBC count, white blood cell count, white blood count, leucocytes</td>
                  <td colspan="2">WBC</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>platelets, platelet, platelet count, platelet counts</td>
                  <td colspan="2">Platelets</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>CrCl<sup>i</sup>, creatine clearance</td>
                  <td colspan="2">CrCl</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ALP<sup>j</sup>, alkaline phosphatase</td>
                  <td colspan="2">ALP</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ULN<sup>k</sup>, upper limit of normal</td>
                  <td colspan="2">ULN</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>LLN<sup>l</sup>, lower limit of normal</td>
                  <td colspan="2">LLN</td>
                </tr>
                <tr valign="top">
                  <td colspan="4">
                    <bold>Rules related to unit and temporal modifier</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>less than or equal to, ≤</td>
                  <td colspan="2">≤</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>greater than or equal to, ≥</td>
                  <td colspan="2">≥</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>greater than, &gt;</td>
                  <td colspan="2">&gt;</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>less than, &lt;</td>
                  <td colspan="2">&lt;</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>within 4 weeks, within 28 days</td>
                  <td colspan="2">within 4 weeks</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>within 2 weeks, within 14 days</td>
                  <td colspan="2">within 2 weeks</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>within 3 weeks, within 21 days</td>
                  <td colspan="2">within 3 weeks</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>last 6 months, past 6 months, within 6 months, within six months</td>
                  <td colspan="2">within 6 months</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>last 3 months, past 3 months, within 3 months, within three months</td>
                  <td colspan="2">within 3 months</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>within 2 years, last 2 years, past 2 years</td>
                  <td colspan="2">within 2 years</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>within 3 years, last 3 years, past 3 years</td>
                  <td colspan="2">within 3 years</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>within 5 years, last 5 years, past 5 years</td>
                  <td colspan="2">within 5 years</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>10<sup>9</sup>/L, 10<sup>9</sup>/L, 10<sup>3</sup>/uL, 10<sup>3</sup>/microliter, 1000/uL, 1000/microliter, K/microliter, 10<sup>3</sup>/mm<sup>3</sup></td>
                  <td colspan="2">10<sup>3</sup>/uL</td>
                </tr>
                <tr valign="top">
                  <td colspan="4">
                    <bold>Other miscellaneous rules</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Case insensitive</td>
                  <td colspan="2">—<sup>m</sup></td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Remove spaces</td>
                  <td colspan="2"> —</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>AST: aspartate aminotransferase.</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>SGOT: serum glutamic oxaloacetic transaminase.</p>
              </fn>
              <fn id="table1fn3">
                <p><sup>c</sup>ALT: alanine transaminase.</p>
              </fn>
              <fn id="table1fn4">
                <p><sup>d</sup>SGPT: serum glutamic pyruvic transaminase.</p>
              </fn>
              <fn id="table1fn5">
                <p><sup>e</sup>Hgb: hemoglobin.</p>
              </fn>
              <fn id="table1fn6">
                <p><sup>f</sup>HbA<sub>1c</sub>: glycated hemoglobin.</p>
              </fn>
              <fn id="table1fn7">
                <p><sup>g</sup>ANC: absolute neutrophil count.</p>
              </fn>
              <fn id="table1fn8">
                <p><sup>h</sup>WBC: white blood cell.</p>
              </fn>
              <fn id="table1fn9">
                <p><sup>i</sup>CrCl: creatinine clearance.</p>
              </fn>
              <fn id="table1fn10">
                <p><sup>j</sup>ALP: alkaline phosphatase.</p>
              </fn>
              <fn id="table1fn11">
                <p><sup>k</sup>ULN: upper limit of normal.</p>
              </fn>
              <fn id="table1fn12">
                <p><sup>l</sup>LLN: lower limit of normal.</p>
              </fn>
              <fn id="table1fn13">
                <p><sup>m</sup>Not applicable.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Transforming Hypernyms to Hyponyms Along With Corresponding Values</title>
          <p>To formalize hypernyms, identified in primary groups such as <italic>laboratory test</italic>, <italic>comorbidity</italic>, biomarker, <italic>prior therapy</italic>, and <italic>other medication</italic>, we used the following approaches: (1) for <italic>adequate organ function</italic> <italic>laboratory test</italic> values, we determined prevalent laboratory test values by analyzing the unique laboratory test values for each test across the trials of the same cancer type that defined the normal organ function; and (2) for <italic>comorbidity</italic>, <italic>biomarker</italic>, <italic>prior therapy</italic>, and <italic>other medication</italic> hypernyms, we collected all example hyponyms described across the trials of the same cancer type.</p>
        </sec>
      </sec>
      <sec>
        <title>Creation of a Prototype Interface for Enhancing Trial Protocol Design Optimization</title>
        <p>We developed a prototype interface using the R programming language (R Foundation for Statistical Computing) and the <italic>Shiny</italic> package to enhance trial protocol design optimization. The interface allows users to simulate the number of eligible patients based on specific criteria, including a combination of criteria such as histology, stages, laboratory test values, performance scores, prior line of therapy, and comorbidities. For this pilot study, a subset of patients with NSCLC (n=2775) was selected and deidentified. To ensure consistency and accuracy, we standardized the sample entities found in both the eligibility criteria knowledge base and EHRs using concept codes such as the <italic>International Classification of Diseases</italic>; Logical Observation Identifiers, Names, and Codes (LOINC); and normalized medical prescription codes. In addition, we converted the patients’ absolute laboratory test values to either the upper limit of normal (ULN) or the lower limit of normal based on the provided normal ranges for each specific test. <xref ref-type="table" rid="table2">Tables 2</xref> and <xref ref-type="table" rid="table3">3</xref> and <xref ref-type="boxed-text" rid="box1">Textbox 1</xref> present some examples of normalized concepts and their codes.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Examples of normalized codes for each concept and normal range of each laboratory test.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="bottom">
                <td>Laboratory test</td>
                <td>LOINC<sup>a</sup> code</td>
                <td>Normal range</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>ALT<sup>b</sup> (SGPT<sup>c</sup>; U/L)</td>
                <td>1742-6</td>
                <td>7-56</td>
              </tr>
              <tr valign="top">
                <td>AST<sup>d</sup> (SGOT<sup>e</sup>; U/L)</td>
                <td>1920-8</td>
                <td>10-40</td>
              </tr>
              <tr valign="top">
                <td>Total bilirubin in serum (mg/dL)</td>
                <td>1975-2</td>
                <td>0.1-1.2</td>
              </tr>
              <tr valign="top">
                <td>Direct (conjugated) bilirubin in serum (mg/dL)</td>
                <td>1968-7</td>
                <td>&lt;0.3</td>
              </tr>
              <tr valign="top">
                <td>Serum creatinine (mg/dL)</td>
                <td>2160-0</td>
                <td>0.6-1.2 (male), 0.5-1.1 (female)</td>
              </tr>
              <tr valign="top">
                <td>CrCl<sup>f</sup> (mL/min)</td>
                <td>2164-2</td>
                <td>97-137 (male), 88-128 (female)</td>
              </tr>
              <tr valign="top">
                <td>ANC<sup>g</sup> (cells/µL)</td>
                <td>26499-4</td>
                <td>&gt;90 mL/min/1.73 m<sup>2</sup></td>
              </tr>
              <tr valign="top">
                <td>Platelets (cells/µL)</td>
                <td>777-3</td>
                <td>150,000-450,000</td>
              </tr>
              <tr valign="top">
                <td>Hemoglobin (g/dL)</td>
                <td>718-7</td>
                <td>12-18</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>LOINC: Logical Observation Identifiers, Names, and Codes.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>ALT: alanine transaminase.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>SGPT: serum glutamic pyruvic transaminase.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>AST: aspartate aminotransferase.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>SGOT: serum glutamic oxaloacetic transaminase.</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>CrCl: creatinine clearance.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>ANC: absolute neutrophil count.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Examples of International Classification of Diseases, Tenth Revision (ICD-10), and International Classification of Diseases, Ninth Revision (ICD-9), disease codes.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Disease</td>
                <td><italic>ICD-10</italic> codes</td>
                <td><italic>ICD-9</italic> codes</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Congestive heart failure</td>
                <td>I50.2, I50.3, I50.4</td>
                <td>428.[2-4][0-3]</td>
              </tr>
              <tr valign="top">
                <td>Unstable angina</td>
                <td>I20.0</td>
                <td>411.1</td>
              </tr>
              <tr valign="top">
                <td>Acute myocardial infarction</td>
                <td>I21</td>
                <td>410.9[0-2]</td>
              </tr>
              <tr valign="top">
                <td>Arrythmia</td>
                <td>I49</td>
                <td>429.9</td>
              </tr>
              <tr valign="top">
                <td>Torsade de pointes</td>
                <td>I45.81</td>
                <td>426.82</td>
              </tr>
              <tr valign="top">
                <td>Long QT syndrome</td>
                <td>I45.81</td>
                <td>426.82</td>
              </tr>
              <tr valign="top">
                <td>Atrial fibrillation and flutter</td>
                <td>I48</td>
                <td>427.3[1-2]</td>
              </tr>
              <tr valign="top">
                <td>Symptomatic bradycardia</td>
                <td>R00.1</td>
                <td>427.89</td>
              </tr>
              <tr valign="top">
                <td>Uncontrolled hypertension</td>
                <td>I10</td>
                <td>401.[09]</td>
              </tr>
              <tr valign="top">
                <td>Heart aneurysm</td>
                <td>I25.3</td>
                <td>414.1[09]</td>
              </tr>
              <tr valign="top">
                <td>Coronary heart disease</td>
                <td>I25.1</td>
                <td>414.01</td>
              </tr>
              <tr valign="top">
                <td>Cardiomyopathy</td>
                <td>I42.9</td>
                <td>425.[49­]</td>
              </tr>
              <tr valign="top">
                <td>Vasculitis, or angiitis</td>
                <td>I77.6</td>
                <td>447.6</td>
              </tr>
              <tr valign="top">
                <td>Pericardial effusion</td>
                <td>I31.3</td>
                <td>423.9</td>
              </tr>
              <tr valign="top">
                <td>Peripheral vascular disease</td>
                <td>I73.9</td>
                <td>443.9</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <boxed-text id="box1" position="float">
          <title>Examples of normalized medical prescription (RxNORM) drug codes.</title>
          <p>
            <bold>Drug and RxNORM code</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Bortezomib: 356733</p>
            </list-item>
            <list-item>
              <p>Carfilzomib: 1302966</p>
            </list-item>
            <list-item>
              <p>Ixazomib: 1723735</p>
            </list-item>
            <list-item>
              <p>Lenalidomide: 342369</p>
            </list-item>
            <list-item>
              <p>Pomalidomide: 1369713</p>
            </list-item>
          </list>
        </boxed-text>
        <p>The interface uses a rule-based algorithm to match patients’ EHR data with the criteria. The comprehensive rules for matching EHR data with criteria have been described in our previous studies [<xref ref-type="bibr" rid="ref37">37</xref>]; for instance, we defined the following rules to map each laboratory test in EHRs to 1 corresponding LOINC code:</p>
        <list list-type="order">
          <list-item>
            <p>Mapping the laboratory test in the LOINC dictionary to the laboratory test in the EHR, based on the popularity rank available in the LOINC dictionary</p>
          </list-item>
          <list-item>
            <p>Mapping the laboratory test for serum or plasma samples in the LOINC dictionary to the laboratory test in the EHR when the popularity rank is not available in the LOINC dictionary</p>
          </list-item>
          <list-item>
            <p>If one-to-one mapping is not feasible using rule 1 and rule 2, the test unit (eg, <italic>gram</italic> is preferred ove<italic>molar</italic>) is considered to facilitate the mapping</p>
          </list-item>
          <list-item>
            <p>When one-to-one mapping is not attainable using rule 1, rule 2, and rule 3, preference is given to the laboratory test that lacks information about the method for mapping</p>
          </list-item>
        </list>
        <p>We associated medication classes with their respective medications; for instance, we extended the annotation “post-menopausal not older than 60 years and taking LHRH [luteinizing hormone–releasing hormone] agonist” to include “post-menopausal not older than 60 years and taking goserelin, leuprolide, or other LHRH agonists.” To achieve this, we used both our in-house knowledge bases and standard resources, such as the National Comprehensive Cancer Network’s Clinical Practice Guidelines in Oncology.</p>
        <p>Users can specify different criteria and combinations, such as different laboratory test values with specific conditions such as <italic>no brain metastasis</italic> to determine the number of qualified patients. The algorithm matches each patient’s EHR data with the selected criteria and calculates the number of matched patients for each criterion. The performance of the interface was evaluated by comparing it to the manual patient selection process conducted by experienced clinical domain experts.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study was confirmed and approved by the Program for the Protection of Human Subjects at the Mount Sinai School of Medicine (IRB-17-01245)</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Development of Eligibility Criteria–Specific Ontology</title>
        <p>Our analysis of cancer clinical trials revealed that hormone therapy was the most frequently applied modality (1470/2970, 47.37%), primarily in BCa and PCa trials, followed by targeted therapy (753/2970, 25.35%) and immunotherapy (691/2970, 23.26%). Chemotherapy alone was used in 3.8% (113/2970) of the clinical trials. We developed an eligibility criteria ontology applicable to all cancer trials by manually analyzing 425 eligibility criteria (<xref rid="figure1" ref-type="fig">Figure 1</xref>). Entities were categorized into 10 primary groups (inside the blue dotted box) and 9 modifier groups based on semantic types and relations. Entities falling outside the blue dotted box were classified as <italic>other observation</italic>. The inclusion criteria mainly involved entities in the <italic>demographic</italic>, <italic>diagnosis</italic>, <italic>laboratory test</italic>, and <italic>vital</italic> groups, while the exclusion criteria commonly included entities in the <italic>comorbidity</italic>, <italic>procedure</italic>, and <italic>other medication</italic> groups. Entities in the <italic>biomarker</italic>, <italic>prior therapy</italic>, and <italic>disease status</italic> groups appeared in both the inclusion and exclusion criteria. Relationships originated from the primary groups and terminated in the modifier groups, except for the <italic>has outcome</italic> relationship, which started and ended in the primary group (<xref rid="figure1" ref-type="fig">Figure 1</xref>). To assess the applicability of the cancer eligibility criteria ontology in a different disease context, we conducted a manual analysis of 60 trials related to UC and CD. For reference, the computable formats of the manually annotated 485 trials can be found in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendices 4</xref>-<xref ref-type="supplementary-material" rid="app8">8</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Clinical trial eligibility criteria ontology. Primary entities are grouped inside the blue dotted box. Modifier entities are placed outside the blue dotted box. The relationship between the primary entities and modifier entities always starts at a primary entity and ends at a modifier entity. LOT: line of therapy.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e50800_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>NLP Pipeline Quality Metrics</title>
        <p>To evaluate the quality of our NLP pipeline, we computed precision, recall, and <italic>F</italic><sub>1</sub>-score measures. For the primary group entities, the average scores were 0.91 (precision), 0.79 (recall), and 0.83 (<italic>F</italic><sub>1</sub>-score). <xref ref-type="table" rid="table4">Table 4</xref> presents the range of precision, recall, and <italic>F</italic><sub>1</sub>-score values of 17 primary group entities.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Performance scores of customized natural language processing pipeline for each entity in the primary groups.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="470"/>
            <col width="0"/>
            <col width="200"/>
            <col width="0"/>
            <col width="160"/>
            <col width="0"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Primary group and attribute group::name</td>
                <td colspan="2">Precision</td>
                <td colspan="2">Recall</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="8">
                  <bold>Demographic</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Demographic::age</td>
                <td colspan="2">1.000</td>
                <td colspan="2">0.923</td>
                <td colspan="2">0.960</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Demographic::gender</td>
                <td colspan="2">1.000</td>
                <td colspan="2">0.870</td>
                <td colspan="2">0.931</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Diagnosis</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Diagnosis::histology</td>
                <td colspan="2">1.000</td>
                <td colspan="2">1.000</td>
                <td colspan="2">1.000</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Diagnosis::stage</td>
                <td colspan="2">0.667</td>
                <td colspan="2">1.000</td>
                <td colspan="2">0.800</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Biomarker</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Biomarker::biomarker</td>
                <td colspan="2">1.000</td>
                <td colspan="2">0.800</td>
                <td colspan="2">0.889</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Disease status</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clinical status::disease status</td>
                <td colspan="2">0.737</td>
                <td colspan="2">0.684</td>
                <td colspan="2">0.709</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Prior therapy</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prior therapy::chemotherapy</td>
                <td colspan="2">0.944</td>
                <td colspan="2">0.895</td>
                <td colspan="2">0.919</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prior therapy::targeted therapy</td>
                <td colspan="2">1.000</td>
                <td colspan="2">0.786</td>
                <td colspan="2">0.880</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prior therapy::immunotherapy</td>
                <td colspan="2">0.897</td>
                <td colspan="2">0.788</td>
                <td colspan="2">0.839</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prior therapy::radiotherapy</td>
                <td colspan="2">0.682</td>
                <td colspan="2">0.682</td>
                <td colspan="2">0.682</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prior therapy::adjuvant therapy</td>
                <td colspan="2">1.000</td>
                <td colspan="2">0.571</td>
                <td colspan="2">0.727</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prior therapy::neoadjuvant therapy</td>
                <td colspan="2">1.000</td>
                <td colspan="2">0.500</td>
                <td colspan="2">0.667</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Comorbidity</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Comorbidity::disease</td>
                <td colspan="2">0.842</td>
                <td colspan="2">0.762</td>
                <td colspan="2">0.800</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Laboratory test</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Laboratory test::test</td>
                <td colspan="2">0.871</td>
                <td colspan="2">0.818</td>
                <td colspan="2">0.844</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Vital</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Vital::vital</td>
                <td colspan="2">1.000</td>
                <td colspan="2">1.000</td>
                <td colspan="2">1.000</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Procedure</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Procedure::procedure</td>
                <td colspan="2">1.000</td>
                <td colspan="2">0.600</td>
                <td colspan="2">0.750</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>Other medication</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other medication::medication</td>
                <td colspan="2">0.800</td>
                <td colspan="2">0.727</td>
                <td colspan="2">0.762</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Eligibility Criteria Attribute Extraction and Classification</title>
        <p>The integrated named entity recognition and relation model extracted 9090 NSCLC, 7427 PCa, 10,217 BCa, 6803 MM, 1565 CD, and 1586 UC entities along with their attribute relations. After normalization and manual curation processes, the eligibility criteria knowledge base for each disease type was established in the <italic>EntityGroup-AttributeName-Value</italic> format (<xref ref-type="supplementary-material" rid="app9">Multimedia Appendices 9</xref>-<xref ref-type="supplementary-material" rid="app14">14</xref>). The number of unique <italic>EntityGroup-AttributeName-Value</italic> combinations varied across disease types, with 494 from 817 NSCLC trials, 471 from 649 PCa trials, 525 from 1057 BCa trials, 389 from 447 MM trials, 231 from 160 UC trials, and 230 from 151 CD trials. Notably, UC and CD trials had a smaller number of unique <italic>EntityGroup-AttributeName-Value</italic> combinations compared to cancer trials, indicating the presence of more complicated eligibility criteria in cancer trials.</p>
        <p><xref rid="figure2" ref-type="fig">Figure 2</xref> and <xref ref-type="table" rid="table5">Table 5</xref> show the distribution of <italic>EntityGroup-AttributeName-Value</italic> combinations in each primary group from different diseases and provide examples. The <italic>laboratory test</italic>, <italic>prior therapy</italic>, and <italic>comorbidity</italic> groups exhibited a high number of <italic>EntityGroup-AttributeName-Value</italic> combinations, followed by the <italic>biomarker</italic> and <italic>other medication</italic> groups. Variations were observed between solid cancers and hematologic cancers, with higher numbers of <italic>EntityGroup-AttributeName-Value</italic> combinations in solid cancer types for <italic>prior therapy</italic> and <italic>biomarker</italic>, while <italic>laboratory test</italic> and <italic>comorbidity</italic> were comparable. The <italic>diagnosis</italic> group exhibited varying numbers of <italic>EntityGroup-AttributeName-Value</italic> combinations across all 4 cancer types (BCa, MM, NSCLC, and PCa). <italic>EntityGroup-AttributeName-Value</italic> in the <italic>biomarker</italic>, <italic>diagnosis</italic>, and <italic>prior therapy</italic> groups were specified per indication, while shared <italic>EntityGroup-AttributeName-Value</italic> were found in other primary groups.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Distribution of attributes in the 10 primary groups as well as the other observation group extracted from the eligibility criteria of 4 different cancer types and 2 different autoimmune diseases. BCa: breast cancer; CD: Crohn disease; MM: multiple myeloma; NSCLC: non–small cell lung cancer; PCa: prostate cancer; UC: ulcerative colitis.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e50800_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>The number of attributes for 10 primary groups along with examples.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="180"/>
            <col width="90"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="0"/>
            <col width="520"/>
            <thead>
              <tr valign="top">
                <td>Primary group</td>
                <td colspan="5">Number of attributes</td>
                <td>Example attributes: group, name, value (with or without condition)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>NSCLC<sup>a</sup></td>
                <td>BCa<sup>b</sup></td>
                <td>PCa<sup>c</sup></td>
                <td>MM<sup>d</sup></td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Demographic</td>
                <td>11</td>
                <td>12</td>
                <td>10</td>
                <td>5</td>
                <td colspan="2">Demographic, age, ≥18 y</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis</td>
                <td>18</td>
                <td>31</td>
                <td>17</td>
                <td>4</td>
                <td colspan="2">Stage, TNM<sup>e</sup> system, T2b<sup>f</sup></td>
              </tr>
              <tr valign="top">
                <td>Biomarker</td>
                <td>49</td>
                <td>72</td>
                <td>42</td>
                <td>14</td>
                <td colspan="2">Biomarker, HER2<sup>g</sup> mutation, L755P<sup>h</sup></td>
              </tr>
              <tr valign="top">
                <td>Disease status</td>
                <td>11</td>
                <td>11</td>
                <td>13</td>
                <td>9</td>
                <td colspan="2">Disease status, relapsed, yes</td>
              </tr>
              <tr valign="top">
                <td>Prior therapy</td>
                <td>114</td>
                <td>108</td>
                <td>93</td>
                <td>50</td>
                <td colspan="2">LOT<sup>i</sup>, prior LOT, ≥2</td>
              </tr>
              <tr valign="top">
                <td>Comorbidity</td>
                <td>105</td>
                <td>96</td>
                <td>97</td>
                <td>108</td>
                <td colspan="2">Cardiovascular disease, arrhythmia, yes (≤3 mo)</td>
              </tr>
              <tr valign="top">
                <td>Laboratory test</td>
                <td>103</td>
                <td>103</td>
                <td>110</td>
                <td>119</td>
                <td colspan="2">Test, AST<sup>j</sup>, ≤2.5x ULN<sup>k</sup></td>
              </tr>
              <tr valign="top">
                <td>Vital</td>
                <td>18</td>
                <td>22</td>
                <td>21</td>
                <td>18</td>
                <td colspan="2">Vital, ECOG<sup>l</sup>, ≥2</td>
              </tr>
              <tr valign="top">
                <td>Procedure</td>
                <td>6</td>
                <td>6</td>
                <td>6</td>
                <td>8</td>
                <td colspan="2">Procedure, organ transplantation, yes</td>
              </tr>
              <tr valign="top">
                <td>Other medication</td>
                <td>45</td>
                <td>45</td>
                <td>45</td>
                <td>46</td>
                <td colspan="2">Other medication, use of anticoagulants, warfarin (&lt;4 wk)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>NSCLC: non–small cell lung cancer.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>BCa: breast cancer.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>PCa: prostate cancer.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>MM: multiple myeloma.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>TNM: tumor, nodes, metastasis.</p>
            </fn>
            <fn id="table5fn6">
              <p><sup>f</sup>T2b: a moderately advanced tumor in terms of size and extent but not the most advanced stage; specific implications can vary based on the type of cancer being described.</p>
            </fn>
            <fn id="table5fn7">
              <p><sup>g</sup>HER2: human epidermal growth factor receptor 2.</p>
            </fn>
            <fn id="table5fn8">
              <p><sup>h</sup>L755P: a reference to a specific mutation in the HER2 gene, with “L” standing for leucine, “755” being the position of the amino acid in the protein, and “P” standing for proline.</p>
            </fn>
            <fn id="table5fn9">
              <p><sup>i</sup>LOT: line of therapy.</p>
            </fn>
            <fn id="table5fn10">
              <p><sup>j</sup>AST: aspartate aminotransferase.</p>
            </fn>
            <fn id="table5fn11">
              <p><sup>k</sup>ULN: upper limit of normal.</p>
            </fn>
            <fn id="table5fn12">
              <p><sup>l</sup>ECOG: Eastern Cooperative Oncology Group.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Transformation of Umbrella Terms Into Computable Attributes With Representative Values</title>
        <sec>
          <title>Overview</title>
          <p>The conversion of hypernym concepts into computable attributes along with their corresponding values was carried out. <xref ref-type="table" rid="table6">Table 6</xref> provides some examples of converted attributes and their corresponding values for each hypernym. All lists can be found in <xref ref-type="supplementary-material" rid="app9">Multimedia Appendices 9</xref>-<xref ref-type="supplementary-material" rid="app14">14</xref>.</p>
          <table-wrap position="float" id="table6">
            <label>Table 6</label>
            <caption>
              <p>Examples of hypernym concepts (entity and subgroup entity in eligibility criteria) used in eligibility criteria and converted hyponyms along with their corresponding values.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="30"/>
              <col width="640"/>
              <col width="0"/>
              <col width="300"/>
              <thead>
                <tr valign="top">
                  <td colspan="4">Entity and subgroup entity in eligibility criteria and converted attribute</td>
                  <td>Corresponding values</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="5">
                    <bold>Adequate organ function</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Normal hepatic function</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>AST<sup>a</sup></td>
                  <td colspan="2">≤2.5x ULN<sup>b</sup></td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>ALT<sup>c</sup></td>
                  <td colspan="2">≤2.5x ULN</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Total bilirubin</td>
                  <td colspan="2">≤1.5x ULN</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Normal renal function</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Creatinine</td>
                  <td colspan="2">≤1.5x ULN</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Normal hematologic function</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>ANC<sup>d</sup></td>
                  <td colspan="2">≥1500 cells/uL</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Platelets</td>
                  <td colspan="2">≥100,000 cells/uL</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Hemoglobin</td>
                  <td colspan="2">≥9 mg/dL</td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>Comorbidities</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Second malignancy</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>All cancers</td>
                  <td colspan="2">Yes, with exceptions</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Infectious disease</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>HIV</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>HBV<sup>e</sup></td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>HCV<sup>f</sup></td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>TB<sup>g</sup></td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Cardiovascular disease</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>CHF<sup>h</sup></td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>MI<sup>i</sup></td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Angina</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Arrhythmia</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Autoimmune disease</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>UC<sup>j</sup></td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>CD<sup>k</sup></td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Systemic lupus erythematosus</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Rheumatoid arthritis</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Systemic sclerosis</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Graves disease</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Guillain-Barré syndrome</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Antiphospholipid syndrome</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Sjogren syndrome</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td colspan="5"> <bold>Biomarker</bold></td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>EGFR<sup>l</sup> mutation sensitive to TKI<sup>m</sup></bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Exon 19 deletion</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Exon 21 L858R</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Exon 21 L861Q</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Exon 18 G719C</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Exon 18 G719X</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Amplification</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>EGFR mutation resistant to TKI</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Exon 20 T790M</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Exon 20 C797S</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Exon 20 S768I</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Exon 20 insertion</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Mismatch repair deficient</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>MSH2, MSH6, MLH1, PMS2, or EXO1 gene mutation</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>MLH1 hypermethylation</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>Prior therapy (targeted)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>First-generation EGFR inhibitor</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Gefitinib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Erlotinib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Vandetanib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Second-generation EGFR inhibitor</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Afatinib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Dacomitinib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Poziotinib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Tesevatinib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Third-generation EGFR inhibitor</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Osimertinib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Lazertinib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Rociletinib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Tarloxotinib</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Proteasome inhibitor</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Bortezomib based</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Carfilzomib based</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Ixazomib based</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Oprozomib based</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>Prior therapy (hormone)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>First-generation antiandrogen</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Bicalutamide</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Nilutamide</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Flutamide</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Second-generation antiandrogen</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Abiraterone</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Enzalutamide</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Darolutamide</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Apalutamide</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Androgen deprivation therapy</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Leuprolide</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Goserelin</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Degarelix</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>5-α reducing agent</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Finasteride</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Dutasteride</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Megestrol acetate</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td colspan="5">
                    <bold>Other medication</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Current use of antibiotics</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Rifabutin</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Clarithromycin</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Azithromycin</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Imipenem</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="4">
                    <bold>Current use of antiarrhythmic agents</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td>Propafenone</td>
                  <td colspan="2">Yes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td> </td>
                  <td> Procainamide</td>
                  <td colspan="2">Yes</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table6fn1">
                <p><sup>a</sup>AST: aspartate aminotransferase.</p>
              </fn>
              <fn id="table6fn2">
                <p><sup>b</sup>ULN: upper limit of normal.</p>
              </fn>
              <fn id="table6fn3">
                <p><sup>c</sup>ALT: alanine transaminase.</p>
              </fn>
              <fn id="table6fn4">
                <p><sup>d</sup>ANC: absolute neutrophil count.</p>
              </fn>
              <fn id="table6fn5">
                <p><sup>e</sup>HBV: hepatitis B virus.</p>
              </fn>
              <fn id="table6fn6">
                <p><sup>f</sup>HCV: hepatitis C virus.</p>
              </fn>
              <fn id="table6fn7">
                <p><sup>g</sup>TB: tuberculosis.</p>
              </fn>
              <fn id="table6fn8">
                <p><sup>h</sup>CHF: congestive heart failure.</p>
              </fn>
              <fn id="table6fn9">
                <p><sup>i</sup>MI: myocardial infarction.</p>
              </fn>
              <fn id="table6fn10">
                <p><sup>j</sup>UC: ulcerative colitis.</p>
              </fn>
              <fn id="table6fn11">
                <p><sup>k</sup>CD: Crohn disease.</p>
              </fn>
              <fn id="table6fn12">
                <p><sup>l</sup>EGFR: epidermal growth factor receptor.</p>
              </fn>
              <fn id="table6fn13">
                <p><sup>m</sup>TKI: tyrosine kinase inhibitor.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Adequate Organ Function</title>
          <p>Adequate organ function criteria were defined using various laboratory tests. Normal ranges and eligible values for alanine transaminase (ALT)/aspartate aminotransferase (AST), total bilirubin, serum creatinine, creatinine clearance, absolute neutrophil count, platelets, and hemoglobin were determined. Representative values for <italic>adequate organ/hematologic function</italic> included ≤2.5x ULN for ALT/AST, ≤1.5x ULN for total bilirubin/serum creatinine, ≥1500 cells/uL for absolute neutrophil count, ≥100,000 cells/uL for platelets, and ≥9 ng/dL for hemoglobin. <xref rid="figure3" ref-type="fig">Figures 3</xref>A-3H display the laboratory test value range and trial counts for each value in BCa and NSCLC clinical trials. The trends observed are similar in both cancer types.</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Clinical trial counts with each unique laboratory test value defining normal organ function. (A-B) Alanine transaminase (ALT) and aspartate aminotransferase (AST): normal ranges from ≤1x upper limit of normal (ULN) to ≤3x ULN, with exceptions for liver diseases (eg, liver metastasis and Gilbert syndrome [GS]) allowing values of up to ≤5x ULN. (C) Total bilirubin: normal ranges from ≤1x ULN to ≤2.5x ULN, with exceptions for liver diseases (eg, liver metastasis and GS) allowing values of up to ≤3x ULN. (D) Serum creatinine: normal ranges from ≤1x ULN to ≤2.5x ULN. (E) Creatinine clearance: normal ranges from ≥30 to ≥60 mL/min. (F) Hemoglobin: normal ranges from ≥8.0 to ≥11.0 ng/dL. (G) Absolute neutrophil count (ANC): normal ranges from ≥750 to ≥1500 cells/uL. (H) Platelets: normal ranges from ≥50,000 to ≥100,000 cells/uL. BCa: breast cancer; NSCLC: non–small cell lung cancer. For a higher-resolution version of this figure, see <xref ref-type="supplementary-material" rid="app15">Multimedia Appendix 15</xref>.</p>
            </caption>
            <graphic xlink:href="ai_v3i1e50800_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Comorbidities</title>
          <p>The presence of comorbidities is a common exclusion criterion in clinical trials; however, natural language descriptions of comorbidities, such as “uncontrollable cardiovascular diseases,” “pulmonary diseases,” and “autoimmune diseases,” can be ambiguous and need domain knowledge to interpret them. We analyzed the hypernyms and their corresponding hyponyms used in BCa trial eligibility criteria. <xref rid="figure4" ref-type="fig">Figure 4</xref> shows the collected hyponyms for each comorbidity class. The presence of second primary malignancies was excluded in almost all trials.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>The heat map graph illustrates the number of clinical trials with each example hyponym for the hypernym comorbidities. Of note, the exception of atopy is mentioned as an autoimmune disease. The group does not include exceptions of other malignancies such as in situ cervical cancer, noninvasive bladder cancer, curative basal or squamous in situ prostate cancer, in situ breast cancer, or resected skin cancer other than melanoma. CD: Crohn disease; CHF: congestive heart failure; CNS: central nervous system; COPD: chronic obstructive pulmonary disease; DVT/PE: deep vein thrombosis/pulmonary embolism; HBV: hepatitis B virus; HCV: hepatitis C virus; MI: myocardial infarction; RA: rheumatoid arthritis; SLE: systemic lupus erythematosus; T1D: type 1 diabetes; T2D: type 2 diabetes; TB: tuberculosis; UC: ulcerative colitis.</p>
            </caption>
            <graphic xlink:href="ai_v3i1e50800_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Prior Therapy, Other Medication, and Biomarker</title>
          <p>By combining all examples of each hypernym, we broke down these hypernyms into actual medication and mutation hyponyms; for instance, we collected <italic>procainamide</italic> or <italic>propafenone</italic> for <italic>current use of antiarrhythmic medication</italic>. Similarly, we collected epidermal growth factor receptor (EGFR) exon 20 <italic>T790M</italic>, <italic>T797S</italic>, <italic>S768I</italic>, or <italic>insertion</italic> for <italic>EGFR mutations resistant to EGFR inhibitors</italic>.</p>
        </sec>
      </sec>
      <sec>
        <title>Development of a Prototype Interface for the Optimization of Protocol Design</title>
        <p>Our study investigated the impact of various criteria on the number of eligible patients. We developed a prototype interface that uses real-world patient information. Using a subset of deidentified cohorts of patients with NSCLC (n=2775), we deployed an eligibility criteria knowledge base that we had constructed in the interface. <xref rid="figure5" ref-type="fig">Figure 5</xref>A displays the selected criteria list, <xref rid="figure5" ref-type="fig">Figure 5</xref>B shows the corresponding patient number, and <xref rid="figure5" ref-type="fig">Figure 5</xref>C illustrates the distribution of patient numbers in each group.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Screenshots from a prototype interface. (A-B) The selected criteria list and the corresponding number of patients. (C) The distribution of patient numbers in each group. (D) Displayed are eligible patient numbers after sequentially incorporating criteria such as non-squamous histology and stage III and IV, with the further inclusion of aspartate aminotransferase (AST) and alanine transaminase (ALT) laboratory test values of either ≤2.5x upper limit of normal (ULN) or ≤1.0x ULN. (E) The influence of Eastern Cooperative Oncology Group (ECOG) performance status as an additional criterion. Displayed are eligible patient numbers after introducing ECOG scores of 0 to 2 or 0 to 1, with histology, stage, and ALT/AST laboratory test values (&lt;2.5x ULN) as fixed criteria. ANC: absolute neutrophil count; CrCl: creatinine clearance; EGFR: epidermal growth factor receptor; NSCLC: non–small cell lung cancer; PD-1 ab: programmed cell death protein-1. For a higher-resolution version of this figure, see <xref ref-type="supplementary-material" rid="app16">Multimedia Appendix 16</xref>.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e50800_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Sequentially incorporating criteria such as <italic>nonsquamous histology</italic> and <italic>stages III and IV</italic> criteria, we identified 2166 (78.05%) and 426 (15.35%) eligible patients, respectively, from the total pool of 2775 patients with NSCLC. The inclusion of <italic>AST and ALT ≤2.5x ULN</italic> criteria yielded 363 (13.08%) eligible patients from the pool of 2775 patients. Limiting AST and ALT to ≤1.0x ULN resulted in a decreased number of eligible patients (315/2775, 11.35%; <xref rid="figure5" ref-type="fig">Figure 5</xref>D). In addition, we explored the influence of Eastern Cooperative Oncology Group (ECOG) performance status as an additional criterion. With histology, stage, and ALT/AST laboratory test values (&lt;2.5x ULN) as fixed criteria, by introducing ECOG scores of 0 to 2 or 0 to 1, we identified 194 (6.99%) and 151 (5.44%) eligible patients, respectively, from the pool of 2775 patients (<xref rid="figure5" ref-type="fig">Figure 5</xref>E).</p>
        <p>Patient-matching performance was evaluated using precision, recall, and <italic>F</italic><sub>1</sub>-score performance metrics across specific clinical attributes. The average <italic>F</italic><sub>1</sub>-score, computed across 10 attributes from 8 domains (<italic>other primary malignancy</italic>, <italic>congestive heart failure</italic>, <italic>squamous NSCLC</italic>, <italic>organ/tissue transplantation</italic>, <italic>platelets</italic>, programmed death<italic>-1 antibody therapy</italic>, <italic>programmed cell death protein-1 or programmed cell death program-ligand 1 positive, stage groups</italic>, <italic>prior LOT</italic> [line of therapy], and <italic>ECOG</italic>), was 0.94 (range 0.82-1.00 [<xref ref-type="bibr" rid="ref37">37</xref>]).</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The challenge of achieving a high success rate in clinical trials is an ongoing issue [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. Our study demonstrates the feasibility of a data-driven approach to optimize trial protocols and efficiently identify eligible patients by constructing a comprehensive, EHR-interoperable eligibility criteria knowledge base and integrating EHR data. To accomplish this, we analyzed 3281 clinical trials using our customized deep learning NLP model. We extracted all entities with their attributes and converted the hypernym concepts used in eligibility criteria to EHR-compatible hyponyms along with their corresponding values. We also evaluated the feasibility of optimizing the trial protocol design on the interface we developed. This interface offers an efficient and effective approach for assessing the number of eligible patients across various combinations of eligibility criteria such as different laboratory test values as well as combinations that account for vital signs.</p>
        <p>We developed an eligibility criteria–specific ontology by manually scrutinizing 425 eligibility criteria to be used as a reference for manual annotation during NLP model training. Accurately identifying intricate semantic relationships among entities within eligibility criteria is crucial for constructing an appropriate ontology for precise information extraction, including temporal, arithmetic values, Boolean values, and negation modifiers [<xref ref-type="bibr" rid="ref31">31</xref>]. Our customized NLP pipeline based on the eligibility criteria–specific ontology that we created enabled us to efficiently extract all pertinent attributes across different modalities and diseases, allowing for a more accurate definition of the trial population. To determine the applicability of our ontology generated using cancer clinical trials to other disease domains, we compared the concepts and relations in clinical trials of inflammatory bowel diseases. We observed very similar trends, suggesting that our eligibility criteria–specific ontology can be extended to other types of disease trials.</p>
        <p>Moreover, the corpus of 485 manually annotated and standardized trials in a computable format can be used in eligible patient identification in EHRs.</p>
        <p>Liu et al [<xref ref-type="bibr" rid="ref28">28</xref>] conducted a thorough analysis of 352,100 clinical trials across various disease domains and constructed a knowledge base of clinical trial eligibility criteria. Their comprehensive knowledge base and user-friendly interface showcased the potential of advanced NLP techniques in enhancing eligibility criteria analysis and retrieval. Fang et al [<xref ref-type="bibr" rid="ref40">40</xref>] also adopted a data-driven approach to optimizing clinical trial eligibility criteria in the context of Alzheimer disease and pancreatic cancer domains. Building upon these efforts, our study aimed to further narrow the gap between eligibility criteria and EHRs in multicancer domains, specifically in representing the granularities of eligibility criteria for identifying eligible patients and optimizing protocol designs. This was achieved by transforming hypernyms in the criteria into EHR-compatible hyponyms. We found that most of the primary groups include umbrella terms such as <italic>prior therapy</italic> (eg, proper prior therapy for actionable mutations) and <italic>biomarker</italic> (eg, EGFR inhibitor–resistant mutations). Our study also addressed the challenge of standardizing ambiguous clinical concepts in eligibility criteria for EHR interoperability and patient matching. To overcome this challenge, we converted hypernyms to the <italic>Entity-Attribute-Value</italic> format using prevailing values across different cancer types and modality therapies. We believe that our EHR-interoperable standardized eligibility criteria knowledge base and interface, integrating real-world EHR data, have the potential to improve the automatic screening system. This improvement has the potential to significantly reduce manual extraction efforts. Moreover, specific, computable criteria reduce ambiguity in patient identification and enable the inclusion of a broader range of patients who may qualify for the trial but could be excluded when using more general terms. This can increase patient trial enrollment, ultimately improving the overall success rate of trials. Notably, patients who were given the option to participate in a trial by their physicians demonstrated a significantly higher participation rate of 55% [<xref ref-type="bibr" rid="ref41">41</xref>] compared to the current average of 5% to 8% among patients with cancer [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. The implementation of our <italic>hypernym/hyponym</italic> semantic terminology model can likewise improve the effectiveness of information retrieval from EHRs and other clinical databases in the context of real-world evidence studies.</p>
        <p>Certain criteria such as <italic>histology</italic>, <italic>stage</italic>, <italic>previous treatment</italic>, or <italic>biomarker</italic> are difficult to modify, while others such as vital signs or laboratory test values can be adjusted during the protocol design [<xref ref-type="bibr" rid="ref15">15</xref>]. Our study revealed the impact of modifying laboratory test values while keeping other criteria constant, resulting in fluctuations in the number of eligible patients. Our findings, which demonstrate both the number of trials for different laboratory test value ranges and eligible patient numbers, offer insights for optimizing future protocol design and refining patient selection criteria. Seeking future collaboration with clinicians to conduct a direct comparison between the patient identification results by clinical domain experts and those generated by our prototype holds promise for a more comprehensive and informative evaluation of the prototype’s performance and its potential to enhance patient identification for clinical trials. Furthermore, a careful examination of the cases identified by the prototype can provide an understanding of the nature of false positives and false negatives. This will provide insights into how the prototype may differ in its patient identification results compared to manual extraction. Our eligibility criteria knowledge base can also be leveraged for generating SCAs using EHRs. SCAs, derived from real-world evidence, are regarded as substitutes for experimental control arms in trials [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. The integration of SCAs into single-arm trial data or replacing traditional control arms with SCAs can alleviate the burden of target accrual in trials with low eligible patient numbers, such as rare disease or oncology trials with specific biomarkers. The Food and Drug Administration’s approval of the palbociclib inhibitor for male patients with metastatic BCa based on real-world evidence demonstrates the potential and relevance of SCAs in improving trial design and outcomes [<xref ref-type="bibr" rid="ref44">44</xref>].</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Our study has several limitations to consider. First, we focused on a limited scope, analyzing only 4 different cancer types and exploring extendibility in the context of inflammatory bowel diseases. Future studies should encompass a wider range of cancer types and disease domains for a more comprehensive analysis. Second, while most attributes were well defined, some umbrella terms lacked clear examples in other cancer types, potentially affecting result accuracy. Further manual annotation using knowledge bases could enhance the precision of the attribute tables. Third, our data set may be biased because we solely included industry-sponsored trials, potentially limiting the generalizability of our findings. In addition, the NLP training and test data sets in this study can display similarities owing to the shared attributes among different cancer trials, which heightens concerns regarding potential overfitting. Fourth, we did not address entity logic, and establishing the logic between entities would enhance cohort definition accuracy. Fifth and last, our interface feasibility testing was limited to small cohorts of patients with NSCLC, and the generalizability of our findings to other populations or disease conditions may vary. Furthermore, we did not perform a quantitative evaluation of the accuracy of matched patients although domain experts checked whether the patient information matched the eligibility criteria manually. While our model serves as a valuable illustration of how NLP can contribute to the design of trials across different diseases, we fully acknowledge the indispensable role of clinicians and biomedical researchers in ensuring the integrity of trial criteria. Clinical trials vary in their objectives, encompassing assessments of treatment end points, effectiveness, and other specific goals. The process is far more nuanced than merely adjusting laboratory test values because such modifications can have a substantial impact on the pool of eligible patients. Therefore, a comprehensive approach, considering both the clinical and biomedical aspects, is imperative for robust trial design.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Our study using an EHR-executable eligibility criteria knowledge base and real-world patient information provides valuable insights into the influence of different criteria on the number of eligible patients during the protocol design. The findings highlight the potential of using a data-driven approach that incorporates NLP and EHRs in clinical research.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Classification of attributes into primary entities and their subgroups.</p>
        <media xlink:href="ai_v3i1e50800_app1.png" xlink:title="PNG File , 79 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Classification of attributes into modifier entities and their subgroups.</p>
        <media xlink:href="ai_v3i1e50800_app2.png" xlink:title="PNG File , 62 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>The scheme for the natural language processing–assisted clinical trial analysis.</p>
        <media xlink:href="ai_v3i1e50800_app3.png" xlink:title="PNG File , 50 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Manually annotated non–small cell lung cancer trials.</p>
        <media xlink:href="ai_v3i1e50800_app4.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 184 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Manually annotated breast cancer trials.</p>
        <media xlink:href="ai_v3i1e50800_app5.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 133 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Manually annotated prostate cancer trials.</p>
        <media xlink:href="ai_v3i1e50800_app6.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 209 KB"/>
      </supplementary-material>
      <supplementary-material id="app7">
        <label>Multimedia Appendix 7</label>
        <p>Manually annotated multiple myeloma trials.</p>
        <media xlink:href="ai_v3i1e50800_app7.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 57 KB"/>
      </supplementary-material>
      <supplementary-material id="app8">
        <label>Multimedia Appendix 8</label>
        <p>Manually annotated ulcerative colitis and Crohn disease trials.</p>
        <media xlink:href="ai_v3i1e50800_app8.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 136 KB"/>
      </supplementary-material>
      <supplementary-material id="app9">
        <label>Multimedia Appendix 9</label>
        <p>Non–small cell lung cancer attributes.</p>
        <media xlink:href="ai_v3i1e50800_app9.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 28 KB"/>
      </supplementary-material>
      <supplementary-material id="app10">
        <label>Multimedia Appendix 10</label>
        <p>Breast cancer attributes.</p>
        <media xlink:href="ai_v3i1e50800_app10.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 28 KB"/>
      </supplementary-material>
      <supplementary-material id="app11">
        <label>Multimedia Appendix 11</label>
        <p>Prostate cancer attributes.</p>
        <media xlink:href="ai_v3i1e50800_app11.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 26 KB"/>
      </supplementary-material>
      <supplementary-material id="app12">
        <label>Multimedia Appendix 12</label>
        <p>Multiple myeloma attributes.</p>
        <media xlink:href="ai_v3i1e50800_app12.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 23 KB"/>
      </supplementary-material>
      <supplementary-material id="app13">
        <label>Multimedia Appendix 13</label>
        <p>Ulcerative colitis attributes.</p>
        <media xlink:href="ai_v3i1e50800_app13.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 29 KB"/>
      </supplementary-material>
      <supplementary-material id="app14">
        <label>Multimedia Appendix 14</label>
        <p>Crohn disease attributes.</p>
        <media xlink:href="ai_v3i1e50800_app14.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 29 KB"/>
      </supplementary-material>
      <supplementary-material id="app15">
        <label>Multimedia Appendix 15</label>
        <p>Clinical trial counts with each unique laboratory test value defining normal organ function. (A-B) Alanine transaminase (ALT) and aspartate aminotransferase (AST): normal ranges from ≤1x upper limit of normal (ULN) to ≤3x ULN, with exceptions for liver diseases (eg, liver metastasis and Gilbert syndrome [GS]) allowing values of up to ≤5x ULN. (C) Total bilirubin: normal ranges from ≤1x ULN to ≤2.5x ULN, with exceptions for liver diseases (eg, liver metastasis and GS) allowing values of up to ≤3x ULN. (D) Serum creatinine: normal ranges from ≤1x ULN to ≤2.5x ULN. (E) Creatinine clearance: normal ranges from ≥30 to ≥60 mL/min. (F) Hemoglobin: normal ranges from ≥8.0 to ≥11.0 ng/dL. (G) Absolute neutrophil count (ANC): normal ranges from ≥750 to ≥1500 cells/uL. (H) Platelets: normal ranges from ≥50,000 to ≥100,000 cells/uL. BCa: breast cancer; NSCLC: non–small cell lung cancer.</p>
        <media xlink:href="ai_v3i1e50800_app15.png" xlink:title="PNG File , 122 KB"/>
      </supplementary-material>
      <supplementary-material id="app16">
        <label>Multimedia Appendix 16</label>
        <p>Screenshots from a prototype interface. (A-B) The selected criteria list and the corresponding number of patients. (C) The distribution of patient numbers in each group. (D) Displayed are eligible patient numbers after sequentially incorporating criteria such as non-squamous histology and stage III and IV, with the further inclusion of aspartate aminotransferase (AST) and alanine transaminase (ALT) laboratory test values of either ≤2.5x upper limit of normal (ULN) or ≤1.0x ULN. (E) The influence of Eastern Cooperative Oncology Group (ECOG) performance status as an additional criterion. Displayed are eligible patient numbers after introducing ECOG scores of 0 to 2 or 0 to 1, with histology, stage, and ALT/AST laboratory test values (&lt;2.5x ULN) as fixed criteria. ANC: absolute neutrophil count; CrCl: creatinine clearance; EGFR: epidermal growth factor receptor; NSCLC: non–small cell lung cancer; PD-1 ab: programmed cell death protein-1.</p>
        <media xlink:href="ai_v3i1e50800_app16.png" xlink:title="PNG File , 330 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ALT</term>
          <def>
            <p>alanine transaminase</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AST</term>
          <def>
            <p>aspartate aminotransferase</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BCa</term>
          <def>
            <p>breast cancer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CD</term>
          <def>
            <p>Crohn disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ECOG</term>
          <def>
            <p>Eastern Cooperative Oncology Group</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">EGFR</term>
          <def>
            <p>epidermal growth factor receptor</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">LOINC</term>
          <def>
            <p>Logical Observation Identifiers, Names, and Codes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">MM</term>
          <def>
            <p>multiple myeloma</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">NSCLC</term>
          <def>
            <p>non–small cell lung cancer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">PCa</term>
          <def>
            <p>prostate cancer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">SCA</term>
          <def>
            <p>synthetic control arm</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">UC</term>
          <def>
            <p>ulcerative colitis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">ULN</term>
          <def>
            <p>upper limit of normal</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The patient data sets analyzed during this study are not publicly available due to patient privacy, security and the Health Insurance Portability and Accountability Act of 1996 (HIPAA) requirement. To enable a complete run of the code shared in this study, a minimum amount of desensitized sample data could be shared with the sharing agreement. Relevant requests should be addressed to ZL. The Prototype interface is available on the internet [<xref ref-type="bibr" rid="ref45">45</xref>]; the R scripts are available on the internet [<xref ref-type="bibr" rid="ref46">46</xref>].</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>KL, ZL, and XW designed the study and wrote the manuscript. KL, YM, and XW reviewed the literature, clinical trial eligibility criteria, and patient notes and constructed the eligibility criteria–specific ontology. KL, ZL, MM, YM, and TW were responsible for the model training, the postprocessing procedure, and the data analysis. TJ, LA, EC, WO, GS, ES, and XW discussed the project and reviewed the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>KL, ZL, TJ, MM, YM, TW, LA, EC, GS, and XW are employees of Sema4. WO and ES are employees of the Icahn School of Medicine at Mount Sinai. WO holds stock in GeneDx. ES was employed by Sema4 and held stock in the company at the time the work in this paper was carried out.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dickson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gagnon</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>Key factors in the rising cost of new drug discovery and development</article-title>
          <source>Nat Rev Drug Discov</source>
          <year>2004</year>
          <month>05</month>
          <volume>3</volume>
          <issue>5</issue>
          <fpage>417</fpage>
          <lpage>29</lpage>
          <pub-id pub-id-type="doi">10.1038/nrd1382</pub-id>
          <pub-id pub-id-type="medline">15136789</pub-id>
          <pub-id pub-id-type="pii">nrd1382</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wouters</surname>
              <given-names>OJ</given-names>
            </name>
            <name name-style="western">
              <surname>McKee</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Luyten</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Estimated research and development investment needed to bring a new medicine to market, 2009-2018</article-title>
          <source>JAMA</source>
          <year>2020</year>
          <month>03</month>
          <day>03</day>
          <volume>323</volume>
          <issue>9</issue>
          <fpage>844</fpage>
          <lpage>53</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32125404"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2020.1166</pub-id>
          <pub-id pub-id-type="medline">32125404</pub-id>
          <pub-id pub-id-type="pii">2762311</pub-id>
          <pub-id pub-id-type="pmcid">PMC7054832</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pazdur</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sridhara</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Re-evaluating eligibility criteria for oncology clinical trials: analysis of investigational new drug applications in 2015</article-title>
          <source>J Clin Oncol</source>
          <year>2017</year>
          <month>11</month>
          <day>20</day>
          <volume>35</volume>
          <issue>33</issue>
          <fpage>3745</fpage>
          <lpage>52</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28968168"/>
          </comment>
          <pub-id pub-id-type="doi">10.1200/JCO.2017.73.4186</pub-id>
          <pub-id pub-id-type="medline">28968168</pub-id>
          <pub-id pub-id-type="pmcid">PMC5692723</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Garcia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bisen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>XJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ramalingam</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schiller</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Gerber</surname>
              <given-names>DE</given-names>
            </name>
          </person-group>
          <article-title>Thoracic oncology clinical trial eligibility criteria and requirements continue to increase in number and complexity</article-title>
          <source>J Thorac Oncol</source>
          <year>2017</year>
          <month>10</month>
          <volume>12</volume>
          <issue>10</issue>
          <fpage>1489</fpage>
          <lpage>95</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1556-0864(17)30617-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jtho.2017.07.020</pub-id>
          <pub-id pub-id-type="medline">28802905</pub-id>
          <pub-id pub-id-type="pii">S1556-0864(17)30617-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC5610621</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Osarogiagbon</surname>
              <given-names>RU</given-names>
            </name>
            <name name-style="western">
              <surname>Vega</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Fashoyin-Aje</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wedam</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ison</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Atienza</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>De Porre</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Biswas</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Holloway</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Wempe</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Schilsky</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Wade</surname>
              <given-names>JL 3rd</given-names>
            </name>
          </person-group>
          <article-title>Modernizing clinical trial eligibility criteria: recommendations of the ASCO-friends of cancer research prior therapies work group</article-title>
          <source>Clin Cancer Res</source>
          <year>2021</year>
          <month>05</month>
          <day>01</day>
          <volume>27</volume>
          <issue>9</issue>
          <fpage>2408</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33563637"/>
          </comment>
          <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-20-3854</pub-id>
          <pub-id pub-id-type="medline">33563637</pub-id>
          <pub-id pub-id-type="pii">1078-0432.CCR-20-3854</pub-id>
          <pub-id pub-id-type="pmcid">PMC8170959</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stensland</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>McBride</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Latif</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wisnivesky</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hendricks</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Roper</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Boffetta</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>WK</given-names>
            </name>
            <name name-style="western">
              <surname>Galsky</surname>
              <given-names>MD</given-names>
            </name>
          </person-group>
          <article-title>Adult cancer clinical trials that fail to complete: an epidemic?</article-title>
          <source>J Natl Cancer Inst</source>
          <year>2014</year>
          <month>09</month>
          <volume>106</volume>
          <issue>9</issue>
          <fpage>dju229</fpage>
          <pub-id pub-id-type="doi">10.1093/jnci/dju229</pub-id>
          <pub-id pub-id-type="medline">25190726</pub-id>
          <pub-id pub-id-type="pii">dju229</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fogel</surname>
              <given-names>DB</given-names>
            </name>
          </person-group>
          <article-title>Factors associated with clinical trials that fail and opportunities for improving the likelihood of success: a review</article-title>
          <source>Contemp Clin Trials Commun</source>
          <year>2018</year>
          <month>09</month>
          <volume>11</volume>
          <fpage>156</fpage>
          <lpage>64</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2451-8654(18)30069-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.conctc.2018.08.001</pub-id>
          <pub-id pub-id-type="medline">30112460</pub-id>
          <pub-id pub-id-type="pii">S2451-8654(18)30069-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC6092479</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nipp</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Paskett</surname>
              <given-names>ED</given-names>
            </name>
          </person-group>
          <article-title>Overcoming barriers to clinical trial enrollment</article-title>
          <source>Am Soc Clin Oncol Educ Book</source>
          <year>2019</year>
          <month>05</month>
          <volume>39</volume>
          <fpage>105</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.1200/edbk_243729</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brøgger-Mikkelsen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zibert</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Andersen</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Thomsen</surname>
              <given-names>SF</given-names>
            </name>
          </person-group>
          <article-title>Online patient recruitment in clinical trials: systematic review and meta-analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>11</month>
          <day>04</day>
          <volume>22</volume>
          <issue>11</issue>
          <fpage>e22179</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/11/e22179/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22179</pub-id>
          <pub-id pub-id-type="medline">33146627</pub-id>
          <pub-id pub-id-type="pii">v22i11e22179</pub-id>
          <pub-id pub-id-type="pmcid">PMC7673977</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Naci</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ioannidis</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>How good is "evidence" from clinical studies of drug effects and why might such evidence fail in the prediction of the clinical utility of drugs?</article-title>
          <source>Annu Rev Pharmacol Toxicol</source>
          <year>2015</year>
          <volume>55</volume>
          <fpage>169</fpage>
          <lpage>89</lpage>
          <pub-id pub-id-type="doi">10.1146/annurev-pharmtox-010814-124614</pub-id>
          <pub-id pub-id-type="medline">25149917</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Heneghan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Goldacre</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Mahtani</surname>
              <given-names>KR</given-names>
            </name>
          </person-group>
          <article-title>Why clinical trial outcomes fail to translate into benefits for patients</article-title>
          <source>Trials</source>
          <year>2017</year>
          <month>03</month>
          <day>14</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>122</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://trialsjournal.biomedcentral.com/articles/10.1186/s13063-017-1870-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13063-017-1870-2</pub-id>
          <pub-id pub-id-type="medline">28288676</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13063-017-1870-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC5348914</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Van Spall</surname>
              <given-names>HG</given-names>
            </name>
            <name name-style="western">
              <surname>Toren</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kiss</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fowler</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Eligibility criteria of randomized controlled trials published in high-impact general medical journals: a systematic sampling review</article-title>
          <source>JAMA</source>
          <year>2007</year>
          <month>03</month>
          <day>21</day>
          <volume>297</volume>
          <issue>11</issue>
          <fpage>1233</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.297.11.1233</pub-id>
          <pub-id pub-id-type="medline">17374817</pub-id>
          <pub-id pub-id-type="pii">297/11/1233</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chakrabarti</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Koski</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Correlating eligibility criteria generalizability and adverse events using Big Data for patients and clinical trials</article-title>
          <source>Ann N Y Acad Sci</source>
          <year>2017</year>
          <month>01</month>
          <volume>1387</volume>
          <issue>1</issue>
          <fpage>34</fpage>
          <lpage>43</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27598694"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/nyas.13195</pub-id>
          <pub-id pub-id-type="medline">27598694</pub-id>
          <pub-id pub-id-type="pmcid">PMC5266625</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Begg</surname>
              <given-names>CB</given-names>
            </name>
          </person-group>
          <article-title>Cancer clinical trials in the USA: patient eligibility, generalizability of results and technology transfer</article-title>
          <source>Bull Cancer</source>
          <year>1987</year>
          <volume>74</volume>
          <issue>2</issue>
          <fpage>197</fpage>
          <lpage>203</lpage>
          <pub-id pub-id-type="medline">3607303</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rizzo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Whipple</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Pineda</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Arnieri</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Capra</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Copping</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Evaluating eligibility criteria of oncology trials using real-world data and AI</article-title>
          <source>Nature</source>
          <year>2021</year>
          <month>04</month>
          <volume>592</volume>
          <issue>7855</issue>
          <fpage>629</fpage>
          <lpage>33</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33828294"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41586-021-03430-5</pub-id>
          <pub-id pub-id-type="medline">33828294</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41586-021-03430-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC9007176</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ko</surname>
              <given-names>YA</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Quyyumi</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Waller</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Higgins</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ziegler</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Brigham</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>GS</given-names>
            </name>
          </person-group>
          <article-title>Developing a synthetic control group using electronic health records: application to a single-arm lifestyle intervention study</article-title>
          <source>Prev Med Rep</source>
          <year>2021</year>
          <month>12</month>
          <volume>24</volume>
          <fpage>101572</fpage>
          <pub-id pub-id-type="doi">10.1016/j.pmedr.2021.101572</pub-id>
          <pub-id pub-id-type="medline">34976636</pub-id>
          <pub-id pub-id-type="pii">S2211-3355(21)00262-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC8683890</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carrigan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Whipple</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Capra</surname>
              <given-names>WB</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Arnieri</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Copping</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rothman</surname>
              <given-names>KJ</given-names>
            </name>
          </person-group>
          <article-title>Using electronic health records to derive control arms for early phase single-arm lung cancer trials: proof-of-concept in randomized controlled trials</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2020</year>
          <month>02</month>
          <volume>107</volume>
          <issue>2</issue>
          <fpage>369</fpage>
          <lpage>77</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31350853"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cpt.1586</pub-id>
          <pub-id pub-id-type="medline">31350853</pub-id>
          <pub-id pub-id-type="pmcid">PMC7006884</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Olvera-Barrios</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Warwick</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Heeren</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Egan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tufail</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Contextualizing single-arm trials with real-world data: an emulated target trial comparing therapies for neovascular age-related macular degeneration</article-title>
          <source>Clin Transl Sci</source>
          <year>2021</year>
          <month>05</month>
          <volume>14</volume>
          <issue>3</issue>
          <fpage>1166</fpage>
          <lpage>75</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33421321"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/cts.12974</pub-id>
          <pub-id pub-id-type="medline">33421321</pub-id>
          <pub-id pub-id-type="pmcid">PMC8212729</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Sim</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Richesson</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Formal representation of eligibility criteria: a literature review</article-title>
          <source>J Biomed Inform</source>
          <year>2010</year>
          <month>06</month>
          <volume>43</volume>
          <issue>3</issue>
          <fpage>451</fpage>
          <lpage>67</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(09)00159-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2009.12.004</pub-id>
          <pub-id pub-id-type="medline">20034594</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(09)00159-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC2878905</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chondrogiannis</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Andronikou</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Tagaris</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Karanastasis</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Varvarigou</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tsuji</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A novel semantic representation for eligibility criteria in clinical trials</article-title>
          <source>J Biomed Inform</source>
          <year>2017</year>
          <month>05</month>
          <volume>69</volume>
          <fpage>10</fpage>
          <lpage>23</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(17)30062-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2017.03.013</pub-id>
          <pub-id pub-id-type="medline">28336477</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(17)30062-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Su</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A review of research on eligibility criteria for clinical trials</article-title>
          <source>Clin Exp Med</source>
          <year>2023</year>
          <month>10</month>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>1867</fpage>
          <lpage>79</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36602707"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10238-022-00975-1</pub-id>
          <pub-id pub-id-type="medline">36602707</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10238-022-00975-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC9815064</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Peleg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Carini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bobak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sim</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>A practical method for transforming free-text eligibility criteria into computable criteria</article-title>
          <source>J Biomed Inform</source>
          <year>2011</year>
          <month>04</month>
          <volume>44</volume>
          <issue>2</issue>
          <fpage>239</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(10)00139-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2010.09.007</pub-id>
          <pub-id pub-id-type="medline">20851207</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(10)00139-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC3129371</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Boland</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Theodoratos</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SB</given-names>
            </name>
          </person-group>
          <article-title>EliXR: an approach to eligibility criteria extraction and representation</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2011</year>
          <month>12</month>
          <volume>18 Suppl 1</volume>
          <issue>Suppl 1</issue>
          <fpage>i116</fpage>
          <lpage>24</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/21807647"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000321</pub-id>
          <pub-id pub-id-type="medline">21807647</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000321</pub-id>
          <pub-id pub-id-type="pmcid">PMC3241167</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hruby</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Rusanov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>EliIE: an open-source information extraction system for clinical trial eligibility criteria</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2017</year>
          <month>11</month>
          <day>01</day>
          <volume>24</volume>
          <issue>6</issue>
          <fpage>1062</fpage>
          <lpage>71</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28379377"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocx019</pub-id>
          <pub-id pub-id-type="medline">28379377</pub-id>
          <pub-id pub-id-type="pii">3098256</pub-id>
          <pub-id pub-id-type="pmcid">PMC6259668</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Erdengasileng</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Transformer-based named entity recognition for parsing clinical trial eligibility criteria</article-title>
          <source>ACM BCB</source>
          <year>2021</year>
          <month>08</month>
          <volume>2021</volume>
          <fpage>49</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34414397"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3459930.3469560</pub-id>
          <pub-id pub-id-type="medline">34414397</pub-id>
          <pub-id pub-id-type="pii">49</pub-id>
          <pub-id pub-id-type="pmcid">PMC8373041</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kreimeyer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Foster</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pandey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Arya</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Halford</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Forshee</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Walderhaug</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Botsis</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing systems for capturing and standardizing unstructured clinical information: a systematic review</article-title>
          <source>J Biomed Inform</source>
          <year>2017</year>
          <month>09</month>
          <volume>73</volume>
          <fpage>14</fpage>
          <lpage>29</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(17)30168-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2017.07.012</pub-id>
          <pub-id pub-id-type="medline">28729030</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(17)30168-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC6864736</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Ta</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hardin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Makadia</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Criteria2Query: a natural language interface to clinical databases for cohort definition</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>04</month>
          <day>01</day>
          <volume>26</volume>
          <issue>4</issue>
          <fpage>294</fpage>
          <lpage>305</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30753493"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocy178</pub-id>
          <pub-id pub-id-type="medline">30753493</pub-id>
          <pub-id pub-id-type="pii">5308980</pub-id>
          <pub-id pub-id-type="pmcid">PMC6402359</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Butler</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A knowledge base of clinical trial eligibility criteria</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>05</month>
          <volume>117</volume>
          <fpage>103771</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00100-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103771</pub-id>
          <pub-id pub-id-type="medline">33813032</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00100-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC8407851</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kury</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Butler</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sim</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Carini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Chia, a large annotated corpus of clinical trial eligibility criteria</article-title>
          <source>Sci Data</source>
          <year>2020</year>
          <month>08</month>
          <day>27</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>281</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-020-00620-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-020-00620-0</pub-id>
          <pub-id pub-id-type="medline">32855408</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-020-00620-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7452886</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dobbins</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mullen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Uzuner</surname>
              <given-names>Ö</given-names>
            </name>
            <name name-style="western">
              <surname>Yetisgen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The Leaf Clinical Trials Corpus: a new resource for query generation from clinical trial eligibility criteria</article-title>
          <source>Sci Data</source>
          <year>2022</year>
          <month>08</month>
          <day>11</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>490</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-022-01521-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-022-01521-0</pub-id>
          <pub-id pub-id-type="medline">35953524</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-022-01521-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC9372145</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Carini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sim</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Analysis of eligibility criteria complexity in clinical trials</article-title>
          <source>Summit Transl Bioinform</source>
          <year>2010</year>
          <month>03</month>
          <day>01</day>
          <volume>2010</volume>
          <fpage>46</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/21347148"/>
          </comment>
          <pub-id pub-id-type="medline">21347148</pub-id>
          <pub-id pub-id-type="pmcid">PMC3041539</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sim</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Olasov</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Carini</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>An ontology of randomized controlled trials for evidence-based practice: content specification and evaluation using the competency decomposition method</article-title>
          <source>J Biomed Inform</source>
          <year>2004</year>
          <month>04</month>
          <volume>37</volume>
          <issue>2</issue>
          <fpage>108</fpage>
          <lpage>19</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532046404000309"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2004.03.001</pub-id>
          <pub-id pub-id-type="medline">15120657</pub-id>
          <pub-id pub-id-type="pii">S1532046404000309</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chandran</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Kalsekar</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Laxmanan</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Higashi</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Jun</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gilman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ai</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Aggarwal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Stolovitzky</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Schadt</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Detecting ground glass opacity features in patients with lung cancer: automated extraction and longitudinal analysis via deep learning–based natural language processing</article-title>
          <source>JMIR AI</source>
          <year>2023</year>
          <month>6</month>
          <day>1</day>
          <volume>2</volume>
          <fpage>e44537</fpage>
          <pub-id pub-id-type="doi">10.2196/44537</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Soysal</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Pakhomov</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>CLAMP - a toolkit for efficiently building customized clinical natural language processing pipelines</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2018</year>
          <month>03</month>
          <day>01</day>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>331</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29186491"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocx132</pub-id>
          <pub-id pub-id-type="medline">29186491</pub-id>
          <pub-id pub-id-type="pii">4657212</pub-id>
          <pub-id pub-id-type="pmcid">PMC7378877</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alfattni</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Peek</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nenadic</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Attention-based bidirectional long short-term memory networks for extracting temporal relationships from clinical discharge summaries</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>11</month>
          <volume>123</volume>
          <fpage>103915</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00244-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103915</pub-id>
          <pub-id pub-id-type="medline">34600144</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00244-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Applying a deep learning-based sequence labeling approach to detect attributes of medical concepts in clinical text</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2019</year>
          <month>12</month>
          <day>05</day>
          <volume>19</volume>
          <issue>Suppl 5</issue>
          <fpage>236</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-019-0937-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-019-0937-2</pub-id>
          <pub-id pub-id-type="medline">31801529</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-019-0937-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC6894107</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Raja</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Higashi</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Jun</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ai</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Calay</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Schadt</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Establishing the automatic identification of clinical trial cohorts from electronic health records by matching normalized eligibility criteria and patient clinical characteristics</article-title>
          <source>medRxiv</source>
          <comment>Preprint posted online April 09, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.medrxiv.org/content/10.1101/2024.02.28.24303396v2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/2024.02.28.24303396</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hay</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Craighead</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Economides</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenthal</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Clinical development success rates for investigational drugs</article-title>
          <source>Nat Biotechnol</source>
          <year>2014</year>
          <month>01</month>
          <volume>32</volume>
          <issue>1</issue>
          <fpage>40</fpage>
          <lpage>51</lpage>
          <pub-id pub-id-type="doi">10.1038/nbt.2786</pub-id>
          <pub-id pub-id-type="medline">24406927</pub-id>
          <pub-id pub-id-type="pii">nbt.2786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Siah</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Lo</surname>
              <given-names>AW</given-names>
            </name>
          </person-group>
          <article-title>Estimation of clinical trial success rates and related parameters</article-title>
          <source>Biostatistics</source>
          <year>2019</year>
          <month>04</month>
          <day>01</day>
          <volume>20</volume>
          <issue>2</issue>
          <fpage>273</fpage>
          <lpage>86</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29394327"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/biostatistics/kxx069</pub-id>
          <pub-id pub-id-type="medline">29394327</pub-id>
          <pub-id pub-id-type="pii">4817524</pub-id>
          <pub-id pub-id-type="pmcid">PMC6409418</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Idnay</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ta</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Marder</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A data-driven approach to optimizing clinical study eligibility criteria</article-title>
          <source>J Biomed Inform</source>
          <year>2023</year>
          <month>06</month>
          <volume>142</volume>
          <fpage>104375</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2023.104375</pub-id>
          <pub-id pub-id-type="medline">37141977</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(23)00096-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC10262300</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Unger</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Hershman</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Till</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Minasian</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Osarogiagbon</surname>
              <given-names>RU</given-names>
            </name>
            <name name-style="western">
              <surname>Fleury</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Vaidya</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>"When offered to participate": a systematic review and meta-analysis of patient agreement to participate in cancer clinical trials</article-title>
          <source>J Natl Cancer Inst</source>
          <year>2021</year>
          <month>03</month>
          <day>01</day>
          <volume>113</volume>
          <issue>3</issue>
          <fpage>244</fpage>
          <lpage>57</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33022716"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jnci/djaa155</pub-id>
          <pub-id pub-id-type="medline">33022716</pub-id>
          <pub-id pub-id-type="pii">5918345</pub-id>
          <pub-id pub-id-type="pmcid">PMC7936064</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Unger</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Vaidya</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hershman</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Minasian</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Fleury</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Systematic review and meta-analysis of the magnitude of structural, clinical, and physician and patient barriers to cancer clinical trial participation</article-title>
          <source>J Natl Cancer Inst</source>
          <year>2019</year>
          <month>03</month>
          <day>01</day>
          <volume>111</volume>
          <issue>3</issue>
          <fpage>245</fpage>
          <lpage>55</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30856272"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jnci/djy221</pub-id>
          <pub-id pub-id-type="medline">30856272</pub-id>
          <pub-id pub-id-type="pii">5307078</pub-id>
          <pub-id pub-id-type="pmcid">PMC6410951</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Unger</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Tai</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bleyer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The role of clinical trial participation in cancer research: barriers, evidence, and strategies</article-title>
          <source>Am Soc Clin Oncol Educ Book</source>
          <year>2016</year>
          <month>05</month>
          <volume>35</volume>
          <fpage>185</fpage>
          <lpage>98</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ascopubs.org/doi/10.1200/EDBK_156686?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1200/EDBK_156686</pub-id>
          <pub-id pub-id-type="medline">27249699</pub-id>
          <pub-id pub-id-type="pii">156686</pub-id>
          <pub-id pub-id-type="pmcid">PMC5495113</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wedam</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fashoyin-Aje</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bloomquist</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sridhara</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Theoret</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Amiri-Kordestani</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Pazdur</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Beaver</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>FDA approval summary: palbociclib for male patients with metastatic breast cancer</article-title>
          <source>Clin Cancer Res</source>
          <year>2020</year>
          <month>03</month>
          <day>15</day>
          <volume>26</volume>
          <issue>6</issue>
          <fpage>1208</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-19-2580</pub-id>
          <pub-id pub-id-type="medline">31649043</pub-id>
          <pub-id pub-id-type="pii">1078-0432.CCR-19-2580</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
          <article-title>Clinical trial eligibility design</article-title>
          <source>Shiny Apps</source>
          <access-date>2024-06-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://zongzhi-liu.shinyapps.io/trialdesign/">https://zongzhi-liu.shinyapps.io/trialdesign/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
          <article-title>trialdesign</article-title>
          <source>GitHub</source>
          <access-date>2024-06-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/zz2liu/trialdesign">https://github.com/zz2liu/trialdesign</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
