<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR AI</journal-id>
      <journal-title>JMIR AI</journal-title>
      <issn pub-type="epub">2817-1705</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v2i1e44779</article-id>
      <article-id pub-id-type="pmid">38875572</article-id>
      <article-id pub-id-type="doi">10.2196/44779</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Scalable Radiomics- and Natural Language Processing–Based Machine Learning Pipeline to Distinguish Between Painful and Painless Thoracic Spinal Bone Metastases: Retrospective Algorithm Development and Validation Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>El Emam</surname>
            <given-names>Khaled</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Malin</surname>
            <given-names>Bradley</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hmouda</surname>
            <given-names>Eljilani</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wang</surname>
            <given-names>Shu-Yi</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Elbattah</surname>
            <given-names>Mahmoud</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Naseri</surname>
            <given-names>Hossein</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Medical Physics Unit</institution>
            <institution>McGill University Health Centre</institution>
            <addr-line>Cedars Cancer Centre</addr-line>
            <addr-line>1001 boul Décarie Montréal</addr-line>
            <addr-line>Montreal, QC, H4A 3J1</addr-line>
            <country>Canada</country>
            <phone>1 514 934 1934 ext 44158</phone>
            <email>3naseri@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0554-4173</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Skamene</surname>
            <given-names>Sonia</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6318-8982</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Tolba</surname>
            <given-names>Marwan</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2812-7348</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Faye</surname>
            <given-names>Mame Daro</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3274-2055</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Ramia</surname>
            <given-names>Paul</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5949-2730</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Khriguian</surname>
            <given-names>Julia</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6472-679X</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>David</surname>
            <given-names>Marc</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0008-9437-9520</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Kildea</surname>
            <given-names>John</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7084-1425</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Medical Physics Unit</institution>
        <institution>McGill University Health Centre</institution>
        <addr-line>Montreal, QC</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Division of Radiation Oncology</institution>
        <institution>McGill University Health Centre</institution>
        <addr-line>Montreal, QC</addr-line>
        <country>Canada</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Hossein Naseri <email>3naseri@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>22</day>
        <month>5</month>
        <year>2023</year>
      </pub-date>
      <volume>2</volume>
      <elocation-id>e44779</elocation-id>
      <history>
        <date date-type="received">
          <day>2</day>
          <month>12</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>6</day>
          <month>2</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>12</day>
          <month>3</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>1</day>
          <month>4</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Hossein Naseri, Sonia Skamene, Marwan Tolba, Mame Daro Faye, Paul Ramia, Julia Khriguian, Marc David, John Kildea. Originally published in JMIR AI (https://ai.jmir.org), 22.05.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on https://www.ai.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://ai.jmir.org/2023/1/e44779" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The identification of objective pain biomarkers can contribute to an improved understanding of pain, as well as its prognosis and better management. Hence, it has the potential to improve the quality of life of patients with cancer. Artificial intelligence can aid in the extraction of objective pain biomarkers for patients with cancer with bone metastases (BMs).</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to develop and evaluate a scalable natural language processing (NLP)– and radiomics-based machine learning pipeline to differentiate between painless and painful BM lesions in simulation computed tomography (CT) images using imaging features (biomarkers) extracted from lesion center point–based regions of interest (ROIs).</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Patients treated at our comprehensive cancer center who received palliative radiotherapy for thoracic spine BM between January 2016 and September 2019 were included in this retrospective study. Physician-reported pain scores were extracted automatically from radiation oncology consultation notes using an NLP pipeline. BM center points were manually pinpointed on CT images by radiation oncologists. Nested ROIs with various diameters were automatically delineated around these expert-identified BM center points, and radiomics features were extracted from each ROI. Synthetic Minority Oversampling Technique resampling, the Least Absolute Shrinkage And Selection Operator feature selection method, and various machine learning classifiers were evaluated using precision, recall, <italic>F</italic><sub>1</sub>-score, and area under the receiver operating characteristic curve.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Radiation therapy consultation notes and simulation CT images of 176 patients (mean age 66, SD 14 years; 95 males) with thoracic spine BM were included in this study. After BM center point identification, 107 radiomics features were extracted from each spherical ROI using pyradiomics. Data were divided into 70% and 30% training and hold-out test sets, respectively. In the test set, the accuracy, sensitivity, specificity, and area under the receiver operating characteristic curve of our best performing model (neural network classifier on an ensemble ROI) were 0.82 (132/163), 0.59 (16/27), 0.85 (116/136), and 0.83, respectively.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our NLP- and radiomics-based machine learning pipeline was successful in differentiating between painful and painless BM lesions. It is intrinsically scalable by using NLP to extract pain scores from clinical notes and by requiring only center points to identify BM lesions in CT images.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>cancer</kwd>
        <kwd>pain</kwd>
        <kwd>palliative care</kwd>
        <kwd>radiotherapy</kwd>
        <kwd>bone metastases</kwd>
        <kwd>radiomics</kwd>
        <kwd>natural language processing</kwd>
        <kwd>machine learning</kwd>
        <kwd>artificial intelligent</kwd>
        <kwd>radiation therapy</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Overview</title>
        <p>Most patients with cancer with bone metastasis (BM) experience pain [<xref ref-type="bibr" rid="ref1">1</xref>] and most receive radiotherapy to control it [<xref ref-type="bibr" rid="ref2">2</xref>]. But, it has been shown that due to the subjective and qualitative nature of the pain, clinicians often underestimate pain [<xref ref-type="bibr" rid="ref3">3</xref>]. As a result, many patients with BM receive radiotherapy after their pain has already become debilitating [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        <p>Although patient-reported outcomes can be used to obtain pain scores directly from patients themselves, the efficacy of these pain scores is limited due to the fact that these ratings are highly qualitative and subjective [<xref ref-type="bibr" rid="ref5">5</xref>]. Because of this, it is desirable to have pain scoring systems that are more objective. The goal of this study was to explore ways to automatically and objectively quantify pain associated with BMs using computed tomography (CT) images.</p>
        <p>We hypothesized that tumor features extracted from CT images of BMs contain imaging biomarkers that may be used to objectively identify BM-associated pain. These pain biomarkers may provide the opportunity to develop objective pain scoring tools to aid in the diagnosis, treatment, understanding, and prognosis of BM pain.</p>
      </sec>
      <sec>
        <title>Background</title>
        <p>The search for imaging and nonimaging pain biomarkers has been the focus of numerous studies [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref12">12</xref>]. Various studies [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref21">21</xref>] have shown how artificial intelligence (AI), including machine learning and radiomics, can be used to understand and quantify pain. For example, Mashayekhi et al [<xref ref-type="bibr" rid="ref22">22</xref>] showed that radiomic features extracted from the CT images of the pancreas can help to identify functional abdominal pain in patients. Vedantam et al [<xref ref-type="bibr" rid="ref23">23</xref>] explored the viability of using radiomics features extracted from magnetic resonance images to detect pain following percutaneous cordotomy. At least 1 study [<xref ref-type="bibr" rid="ref13">13</xref>] has reported using radiomics to identify painful metastatic lesions in radiographic images. However, we found no reports in the literature of a scalable approach that can be used efficiently on a large set of unlabeled patient data. To the best of our knowledge, our work is the first to combine natural language processing (NLP) and radiomics to enable an efficient and scalable pain identification pipeline using unstructured data.</p>
        <p>A fundamental challenge in developing any AI model for use in medicine is the need to obtain sufficient patient data for training and testing. For example, the data set used by Wakabayashi et al in the study that we mentioned earlier [<xref ref-type="bibr" rid="ref13">13</xref>], was limited to 69 patients. One limiting factor is obtaining standard patient-reported pain scores for use as ground-truth data, and another limiting factor is obtaining segmented images from which to extract tumor biomarkers. For the work reported in this paper, we overcame the data set size limitation by using 2 novel strategies. First, by combining NLP with radiomics, we quickly mined pain scores from clinical notes and used these NLP-extracted scores to label our radiomics features for supervised learning. Second, by asking our clinical colleagues to pinpoint only the center points of BM lesions in radiotherapy simulation CT images, we maximized the number of lesions identified in the time available. In the medical field, NLP has shown promising results in extracting biomedical information and clinical outcomes such as pain from unstructured text data [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. Moreover, as we reported previously [<xref ref-type="bibr" rid="ref21">21</xref>], by automatically delineating geometrical regions around BM lesion center points, it is possible to successfully extract radiomics features for robust BM lesion detection. In this study, we report how our combined radiomics-NLP machine learning pipeline can successfully identify pain in radiotherapy simulation CT images of patients with cancer with BMs.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethical Considerations</title>
        <p>This retrospective study was approved by the research ethics board of the McGill University Health Centre (2020-5899) with the waiver of informed consent. We confirm that the entire research was performed in accordance with research ethics board’s guidelines and regulations.</p>
      </sec>
      <sec>
        <title>Data Selection</title>
        <p>Our patient-selection process is outlined in <xref rid="figure1" ref-type="fig">Figure 1</xref>. The initial number of 200 pairs of radiation oncology consultation notes and CT images of patients with spinal BM were included in this study based on the minimum sample size calculation as explained in Section A.1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref27">27</xref>]. In total, 120 of the notes and all 200 of the CT images from this study were independently used in 2 studies we previously reported on [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]. The first [<xref ref-type="bibr" rid="ref25">25</xref>] of these studies showed the feasibility of extracting pain from consultation notes of patients with cancer, using NLP. The second [<xref ref-type="bibr" rid="ref21">21</xref>] demonstrated the feasibility of using lesion center point–based radiomics models to differentiate healthy and metastatic bone lesions in CT scans of patients with BMs. This study combined the data and results from these 2 prior studies and expanded upon them to build an NLP- and radiomics-based model to detect pain using the CT scans of patients.</p>
        <p>We searched our institution’s Oncology Information System for the radiotherapy plans of patients diagnosed with a “secondary malignant neoplasm of bone” between January 2016 and September 2019. From the retrieved list, we selected those who were treated for thoracic spinal BM. Then, we retrieved the corresponding consultation notes and simulation CT images. A note-image pair was included if (1) the note was in English, (2) pain was documented, (3) the simulation CT image was taken up to 10 days post consultation, and (4) simulation CT revealed BM lesions in the thoracic spine. Patients with multiple but nonoverlapping note-image pairs were considered independent samples. We only considered the same patients as new participants if they had CT scans and associated consultation notes for BM lesions in different areas of their spines. As a result, each BM lesion was included only once in our study. Also, it should be noted that palliative patients normally have their simulation CT scan (for treatment planning) on the same day or within a few days after the consultation, and radiotherapy is delivered on the same day or within a few days after treatment planning. To assure that there is no change in the BM lesion structure or pain status, we did not allow more than a 10-day gap between the two. Figure A1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> displays the distribution of the time interval between the radiotherapy consultation and CT acquisition dates.</p>
        <p>We randomly assigned note-image pairs to the training or cross-validation set (approximately 70%) or the holdout test set (approximately 30%). We used stratified randomization to preserve the original sample ratio between pain labels in each sample set. In addition, we performed a paired <italic>t</italic> test and a chi-square analysis [<xref ref-type="bibr" rid="ref28">28</xref>] to ensure that there was no systematic bias in any of our sample sets regarding gender, age, or primary cancer type. Patient demographics are presented in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The patient selection criteria used to obtain the radiotherapy consultation notes and simulation computed tomography (CT) images that formed our training and test data sets. The initial number of 200 note-image pairs included in this study was based on the minimum sample size calculation as explained in Section A.1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. BM: bone metastases; DICOM: Digital Imaging and Communications in Medicine; RT: radiotherapy; T-spine: thoracic spine. *Four patients had pairs in both the training and test sets.</p>
          </caption>
          <graphic xlink:href="ai_v2i1e44779_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Patient demographics in the training and test sets.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="350"/>
            <col width="300"/>
            <col width="160"/>
            <col width="0"/>
            <col width="160"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Characteristics</td>
                <td>Training and validation set (n=121)</td>
                <td>Test set (n=55)</td>
                <td colspan="2"><italic>P</italic> value<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="5">
                  <bold>Gender, n (%)</bold>
                </td>
                <td>N/A<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>56 (46)</td>
                <td>25 (45)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>65 (54)</td>
                <td>30 (55)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Age (years), mean (SD)<sup>c</sup></bold>
                </td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>63 (14)</td>
                <td>64 (12)</td>
                <td colspan="2">.99</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>67 (14)</td>
                <td>64 (13)</td>
                <td colspan="2">.72</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Primary cancer type, n (%)</bold>
                </td>
                <td>.06</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Lung</td>
                <td>32 (26)</td>
                <td>20 (36)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Breast</td>
                <td>23 (19)</td>
                <td>11 (20)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prostate</td>
                <td>19 (16)</td>
                <td>5 (9)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Multiple myeloma</td>
                <td>8 (7)</td>
                <td>6 (11)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Renal cell carcinoma</td>
                <td>7 (6)</td>
                <td>2 (4)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other and unknown</td>
                <td>64 (53)</td>
                <td>31 (56)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Bone metastasis lesions, n (%)</bold>
                </td>
                <td>.42</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Lytic</td>
                <td>220 (52)</td>
                <td>76 (47)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Blastic</td>
                <td>122 (29)</td>
                <td>57 (35)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mix</td>
                <td>81 (19)</td>
                <td>30 (18)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Pain label, n (%)</bold>
                </td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pain</td>
                <td>357 (84)</td>
                <td>136 (83)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No pain</td>
                <td>66 (16)</td>
                <td>27 (17)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup><italic>P</italic> values for numerical values (age) and categorical features (primary cancer site and bone metastasis lesion type) were calculated using a 2-tailed heteroscedastic <italic>t</italic> test and a chi-square test, respectively.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>The <italic>P</italic> value for the age difference between males and females was .20 for the training and validation set and .50 for the test set.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>NLP-Extracted Pain Labels</title>
        <p>Due to the absence of patient-reported pain scores in our Oncology Information System, we extracted physician-reported pain scores from patients' radiation oncology consultation notes using our previously reported NLP pipeline [<xref ref-type="bibr" rid="ref25">25</xref>]. While pain scores were typically reported as part of the “history of the present illness” in our hospital, for the sake of generalizability, we extracted pain scores from the entire note.</p>
        <p>Our NLP pipeline first processed the text with MetaMap [<xref ref-type="bibr" rid="ref29">29</xref>] and mapped it to the UMLS (ie, Unified Medical Language System) Metathesaurus [<xref ref-type="bibr" rid="ref30">30</xref>] in order to identify pain terminologies and their severity scores. Next, it applied rules to filter out hypothetical, conditional, and historical references to pain in order to focus solely on references to pain at the time of the consultation. Then, it calculated the average pain intensity (API) in each note by averaging the pain scores therein. Finally, it assigned each note a “verbally declared pain” (VDP) label, as VDP=“no pain” (if API 0), and VDP=“pain” (if API0). These pain labels were used to train, validate, and test our radiomics model.</p>
      </sec>
      <sec>
        <title>Expert-Extracted Pain Scores</title>
        <p>To evaluate the effect of NLP-extracted pain labels on the performance of our pipeline, we also generated best-available ground-truth pain labels using expert-annotated pain scores. To do so, our radiation oncologists used the texTRACTOR [<xref ref-type="bibr" rid="ref31">31</xref>] pain labeling application to manually read consultation notes and label valid pain scores in our training and test data sets using a 4-grade verbal rating scale (no pain, mild, moderate, and severe). A mention of pain was regarded as valid if it reflected the status of pain at the metastatic sites for which treatment was planned at the time of the consultation. Table A1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> contains all the NLP- and expert-extracted pain scores, and Figure A2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> illustrates the level of agreement between them. Due to the quality of the documented pain scores and lack of interrater agreement among experts (Fleiss κ=0.43), as explained by Naseri et al [<xref ref-type="bibr" rid="ref25">25</xref>], we subsequently defined a binary pain score as “no pain” and “pain” in order to establish satisfactory interrater agreement (κ=0.66) [<xref ref-type="bibr" rid="ref25">25</xref>]. To create binary ground-truth pain labels comparable to the NLP-extracted labels, we assigned notes scored as “no pain” to “no pain” and notes scored as “mild,” “moderate,” and “severe” pain to “pain.” These expert-extracted pain scores were used to measure how well the NLP pipeline works.</p>
      </sec>
      <sec>
        <title>Center Point Identification of BM Lesions</title>
        <p>BM lesion center points were identified by a team comprising a staff radiation oncologist (SS) with 10 years’ experience, a radiation oncology fellow (MT), and 3 third-year radiation oncology residents (J Khriguian, PR, and MF). Simulation CT DICOM (ie, Digital Imaging and Communications in Medicine) files were exported from the radiotherapy treatment planning software and deidentified. Then, the CT images were randomly divided into 5 sets and loaded into the diCOMBINE [<xref ref-type="bibr" rid="ref32">32</xref>] application for BM lesion center point identification. Our experts were blinded to patients’ pain statuses and identities. We requested each expert to label center points for all visually identifiable BM lesions in all CT images within 1 of the 5 sets, and another expert was assigned to validate their labels. A key benefit of this radiomics pipeline [<xref ref-type="bibr" rid="ref21">21</xref>] is that it does not require full lesion segmentation, making it feasible to engage busy clinicians.</p>
      </sec>
      <sec>
        <title>Segmentation of Regions of Interest</title>
        <p>Using our previously reported methodology [<xref ref-type="bibr" rid="ref21">21</xref>], we automatically segmented lesion center point–based nested spherical (SP) regions of interest (ROIs). To do this, we first delineated nested spherical ROIs around the identified BM lesion center points (see <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>, top panel). ROI diameters ranged from 7 mm (3×3 voxels) to 50 mm (average size of the vertebral body) [<xref ref-type="bibr" rid="ref33">33</xref>]. Then, in addition to what was reported by Naseri et al [<xref ref-type="bibr" rid="ref21">21</xref>], we used Hounsfield units thresholding to exclude fat and air regions from the delineated ROIs. For this, motivated by Deglint et al [<xref ref-type="bibr" rid="ref34">34</xref>] and Ulano et al [<xref ref-type="bibr" rid="ref35">35</xref>], we applied a threshold to remove voxels with negative Hounsfield units from our ROIs. Hounsfield units of &#60;0 are associated with fat and air [<xref ref-type="bibr" rid="ref34">34</xref>]. We used OpenCV [<xref ref-type="bibr" rid="ref36">36</xref>] (version 4.4.0) for Hounsfield units thresholding and applied a Gaussian filter to reduce noise. Then, we used pynrrd [<xref ref-type="bibr" rid="ref37">37</xref>] (version 0.4.2) to export each ROI as a 3D binary mask and store it as a.nrrd [<xref ref-type="bibr" rid="ref38">38</xref>] file. Finally, we aggregated these nested ROI masks to form ensemble ROIs. In this study, we examined 2 contrasting ensemble (EN) ROIs as shown in <xref ref-type="boxed-text" rid="box1">Textbox 1</xref> (bottom panel): one with small size and 3 layers (EN3) and the other with large size and 6 layers (EN6). Wakabayashi et al [<xref ref-type="bibr" rid="ref13">13</xref>] and Naseri et al [<xref ref-type="bibr" rid="ref21">21</xref>] have shown that radiomics-based machine learning models trained on ensemble ROIs have better classification performance than single ROI–based models.</p>
        <boxed-text id="box1" position="float">
          <title>The characteristics of the spherical and ensemble regions of interest (ROIs) used in this study.</title>
          <p>Nested spherical (SP) ROIs with Hounsfield units (HUs) intensity thresholds (HU&#62;0):</p>
          <list list-type="bullet">
            <list-item>
              <p>SP7 (diameter 7 mm)</p>
            </list-item>
            <list-item>
              <p>SP10 (diameter 10 mm)</p>
            </list-item>
            <list-item>
              <p>SP15 (diameter 15 mm)</p>
            </list-item>
            <list-item>
              <p>SP20 (diameter 20 mm)</p>
            </list-item>
            <list-item>
              <p>SP30 (diameter 30 mm)</p>
            </list-item>
            <list-item>
              <p>SP50 (diameter 50 mm)</p>
            </list-item>
          </list>
          <p>Ensemble (EN) ROIs:</p>
          <list list-type="bullet">
            <list-item>
              <p>EN3 (ROI SP7+SP10+SP15)</p>
            </list-item>
            <list-item>
              <p>EN6 (ROI SP7+SP10+SP15+SP20+SP30+SP50)</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Radiomics Models</title>
        <p>Our radiomics pipeline is illustrated in <xref rid="figure2" ref-type="fig">Figure 2</xref>. We essentially used our previously reported pipeline [<xref ref-type="bibr" rid="ref21">21</xref>] but with our NLP- and expert-extracted pain labels to train and test it. We made one improvement to the pipeline by incorporating Imbalanced-learn [<xref ref-type="bibr" rid="ref39">39</xref>] (version 0.7.0) as a resampling step to account for imbalance (see below).</p>
        <p>Radiomics features were extracted from each CT image using masks composed of the ensemble ROIs listed in <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>. Then, the feature space was scaled using <italic>z</italic> score normalization [<xref ref-type="bibr" rid="ref40">40</xref>], and the associated NLP-extracted binary pain labels (pain=1, no pain=0) were incorporated. A single NLP-extracted pain score was assigned to all the lesions extracted from a given paired CT image.</p>
        <p>Due to the nature of BM pain [<xref ref-type="bibr" rid="ref41">41</xref>], there was a large imbalance between the number of painful and painless lesions (493 pain, 93 no pain). Therefore, we used the Synthetic Minority Oversampling Technique (SMOTE) [<xref ref-type="bibr" rid="ref42">42</xref>] in the training phase as it has been shown to be the best-performing resampling method for radiomics [<xref ref-type="bibr" rid="ref43">43</xref>]. We did not apply resampling to our test set in order to maintain the original sample imbalance. Then, the Least Absolute Shrinkage And Selection Operator [<xref ref-type="bibr" rid="ref44">44</xref>] feature selection method was applied to the feature space to remove noninformative features. Least Absolute Shrinkage And Selection Operator is a commonly used feature selection method in radiomics studies [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>]. Finally, we examined the Gaussian process regression, linear support vector machine, random forest, and neural networks classifiers, as they were the best performing machine learning classifiers in our previous work. We evaluated the performance of our models on the training set using 5-fold cross-validation. Final evaluation was performed on the test set. The receiver operating characteristic (ROC) [<xref ref-type="bibr" rid="ref47">47</xref>] curve, area under the ROC curve (AUC), precision, sensitivity, specificity, and <italic>F</italic><sub>1</sub>-score metrics were used to report the performance of our models on the training and test sets. We also trained and tested our best performing pipeline using the expert-extracted pain scores (best-available ground-truth) to evaluate the impact of NLP-extracted pain labels.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>The radiomics-based pipeline that we used to select and train a machine learning model to separate painful and painless bone metastasis lesions. Our pipeline is the same as that published by Naseri et al [<xref ref-type="bibr" rid="ref21">21</xref>] but using NLP-extracted pain labels and modified to account for sample imbalance. AUC-ROC: area under the receiver operating characteristic curve-receiver operating characteristic; CT: computed tomography; GPR: Gaussian process regression; LASSO: Least Absolute Shrinkage And Selection Operator; L-SVM: linear support vector machine; ML: machine learning; NLP: natural language processing; NNet: neural network; RF: random forest; ROI: region of interest; SMOTE: Synthetic Minority Oversampling Technique.</p>
          </caption>
          <graphic xlink:href="ai_v2i1e44779_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Patient Demographics</title>
        <p>A total of 176 pairs of radiotherapy consultation notes and simulation CT images of patients with thoracic spinal BM were included in this study. As summarized in <xref ref-type="table" rid="table1">Table 1</xref>, a total of 121 sample pairs (mean patient age 63, SD 14 years; males: n=65, mean age 67, SD 14 years; <italic>P</italic>=.20) were included for training and cross-validation, and 55 sample pairs (mean patient age 64, SD 12 years; males: n=25, mean age 64, SD 13 years; females: mean age 64, SD 23 years; <italic>P</italic>=.50) were included in the test set. The sample selection procedure and data quantities are presented in <xref rid="figure1" ref-type="fig">Figure 1</xref>. The demographics of the patients in the training and test sets are presented in <xref ref-type="table" rid="table1">Table 1</xref>. The most common primary cancer sites were the lungs (n=52), breasts (n=34), and prostate (n=24).</p>
        <p>A total of 586 BM center points were identified by our experts on the training (n=423 lesions) and test (n=163 lesions) data sets. In the training set, 357 (84%) lesions were labeled by the NLP pipeline as painful and 66 lesions were labeled as painless. In the test set, 136 (83%) lesions were identified by the NLP pipeline as painful, and 27 lesions were labeled as painless. This represented a significant but equal imbalance in our training and test sets.</p>
      </sec>
      <sec>
        <title>Segmented ROIs</title>
        <p>Examples of segmented ROIs with the Hounsfield units threshold applied are presented in <xref rid="figure3" ref-type="fig">Figure 3</xref> for painful and painless BMs.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Examples of segmented nested spherical regions of interest (ROIs) with the Hounsfield units threshold applied on computed tomography images of patients with painful (A, B) and painless (C, D) bone metastases lesions. Nested ROIs with diameters of 50, 30, 20, 15, 10, and 7 mm are shown in the insets as different hues.</p>
          </caption>
          <graphic xlink:href="ai_v2i1e44779_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Testing Our Radiomics Models</title>
        <p>In total, 107 radiomics features were extracted from each of the 6 nested ROIs. Then, they were aggregated to form feature spaces for the EN3 (with 321 features) and EN6 (with 642 features) ensemble ROIs. <xref rid="figure4" ref-type="fig">Figure 4</xref> shows the ROC curve of each model in the training (black lines) and test (red squares) data sets using the EN3 and EN6 ROIs. On the training set, the gray range represents the mean (SD) AUC of the 5-fold cross-validation. The AUC and <italic>F</italic><sub>1</sub>-score grids are presented in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <p>The precision, accuracy, sensitivity, specificity, <italic>F</italic><sub>1</sub>-score, and AUC values of our best-performing pipeline (neural networks with the EN6 ROI) are presented in <xref ref-type="table" rid="table3">Table 3</xref>. The performance of this pipeline (trained and tested) on the data set of expert-extracted pain labels (best-available ground-truth) is provided as a quality measurement. The performance of the model described previously by Wakabayashi et al [<xref ref-type="bibr" rid="ref13">13</xref>] is also provided for comparison.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Receiver operating characteristic curves for our classifiers using 3-layer ensemble (EN3) (top row) and 6-layer ensemble (EN6) (bottom row) lesion center point–based ensemble regions of interest in training (black lines) and test (dark red squares) data sets. AUC: area under the receiver operating characteristic curve; GPR: Gaussian process regression; L-SVM: linear support vector machine; NNet: neural network; RF: random forest.</p>
          </caption>
          <graphic xlink:href="ai_v2i1e44779_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>The area under the receiver operating characteristic curves (AUCs) and <italic>F</italic><sub>1</sub>-scores of our machine learning classifiers in the training and test data sets using the ensemble (EN) regions of interest EN3 and EN6 for each of the RF (random forest), GPR (Gaussian process regression), L-SVM (linear support vector machine), and NNet (neural networks) classifiers.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="0"/>
            <col width="110"/>
            <col width="110"/>
            <col width="100"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Region of interest</td>
                <td colspan="5">Training set</td>
                <td colspan="4">Test set</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <break/>
                </td>
                <td>RF</td>
                <td>GPR</td>
                <td>L-SVM</td>
                <td>NNet</td>
                <td colspan="2">RF</td>
                <td>GPR</td>
                <td>L-SVM</td>
                <td>NNet</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="11">
                  <bold>Areas under the receiver operating characteristic curve</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>EN3</td>
                <td>98.3</td>
                <td>98.1</td>
                <td>84.7</td>
                <td>94.6</td>
                <td colspan="2">67.3</td>
                <td>72.1</td>
                <td>75.2</td>
                <td>73.3</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>EN6</td>
                <td>98.1</td>
                <td>98.3</td>
                <td>89.8</td>
                <td>94.0</td>
                <td colspan="2">74.1</td>
                <td>80.6</td>
                <td>82.4</td>
                <td>82.5</td>
              </tr>
              <tr valign="top">
                <td colspan="11">
                  <bold><italic>F</italic><sub>1</sub>-scores</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>EN3</td>
                <td>90.0</td>
                <td>89.9</td>
                <td>79.4</td>
                <td>90.5</td>
                <td colspan="2">60.9</td>
                <td>64.7</td>
                <td>65.4</td>
                <td>63.6</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>EN6</td>
                <td>93.0</td>
                <td>93.0</td>
                <td>84.7</td>
                <td>91.6</td>
                <td colspan="2">63.8</td>
                <td>66.9</td>
                <td>67.4</td>
                <td>69.5</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>The performance of our best-performing natural language processing (NLP)–radiomics pipeline (neural networks with the ensemble 6 region of interest) on the training and test sets using NLP and manually extracted pain labels, together with the results from a prior study by Wakabayashi et al [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="350"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="100"/>
            <col width="110"/>
            <thead>
              <tr valign="bottom">
                <td>
                  <break/>
                </td>
                <td>Accuracy</td>
                <td>Precision</td>
                <td>Sensitivity</td>
                <td>Specificity</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
                <td>AUC<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>This study (training set)</td>
                <td>92.4</td>
                <td>93.2</td>
                <td>92.4</td>
                <td>86.4</td>
                <td>91.6</td>
                <td>94.0</td>
              </tr>
              <tr valign="top">
                <td>This study (test set)</td>
                <td>81.0</td>
                <td>67.9</td>
                <td>59.2</td>
                <td>85.3</td>
                <td>69.5</td>
                <td>82.5</td>
              </tr>
              <tr valign="top">
                <td>This study (training set); using manual pain scores</td>
                <td>94.2</td>
                <td>94.8</td>
                <td>98.7</td>
                <td>89.7</td>
                <td>94.4</td>
                <td>98.1</td>
              </tr>
              <tr valign="top">
                <td>This study (test set); using manual pain scores</td>
                <td>83.5</td>
                <td>64.9</td>
                <td>64.7</td>
                <td>85.7</td>
                <td>68.0</td>
                <td>82.3</td>
              </tr>
              <tr valign="top">
                <td>Wakabayashi et al [<xref ref-type="bibr" rid="ref13">13</xref>] (training test only)</td>
                <td>73.9</td>
                <td>—<sup>b</sup></td>
                <td>71.0</td>
                <td>86.0</td>
                <td>—</td>
                <td>82.0</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>AUC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Not determined.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>Underestimation and undertreatment of cancer pain can significantly diminish the quality of life of patients with cancer. Accordingly, systems that can objectively measure cancer pain have the potential to improve quality of life. In this study, we created a scalable NLP-radiomics pain identification pipeline. Our pipeline is designed for palliative treatment for patients with cancer undergoing radiotherapy therapy, for whom there are typically just 2 contemporaneous sources of relevant medical information at the time of the treatment: consultation notes and simulation CT images. We used an NLP pipeline to extract physician-reported pain scores from radiotherapy consultation notes. NLP-extracted pain scores are appropriate, when structured patient-reported pain scores are unavailable (as is the case for at least 25% to 35% of all patients with cancer [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref48">48</xref>] and for all patients with cancer receiving palliative care who are treated with radiotherapy at our institution at the time the data were used in this study). Our lesion center point–based spherical ROI delineation method significantly sped up the ROI segmentation procedure, enabling us to rapidly delineate BM center points in 176 images in this study. For comparison, the radiomics pipeline that was developed by Wakabayashi et al [<xref ref-type="bibr" rid="ref13">13</xref>] required full 3D segmentation of each ROI (69 images).</p>
      <p>Due to the unbalanced nature of BM pain, our data set contained significantly fewer “no pain” samples. In order to better train our models, we applied SMOTE resampling to the training set to balance the number of samples with the NLP-extracted “pain” and “no pain” labels. We did not apply any resampling techniques to our test (hold out) set to maintain the original sample imbalance. Therefore, while our training set was balanced, our test set had 5 times more “pain” cases than “no pain” cases (136 pain versus 27 no pain cases). This caused a significant change in the pipeline’s performance between the training and test sets. It has been shown that oversampling improves the overall performance of machine learning models, but the effect is stronger on the training set due to the inclusion of replicated samples in the cross-validation subsets [<xref ref-type="bibr" rid="ref49">49</xref>]. Moreover, the imbalance in our test set led to high specificity (ability to properly identify pain instances) and low sensitivity (ability to correctly identify no pain cases) in the performance evaluation. For comparison, the sample imbalance reported by Wakabayashi et al [<xref ref-type="bibr" rid="ref13">13</xref>] was 2:1, resulting in a more balanced relationship between the sensitivity and specificity of their model.</p>
      <p>The performance of our pipeline did not improve much when we trained and tested it using expert-extracted pain labels (best-available ground-truth). This might be the case because, in the first experiment, we both trained and tested our pipeline using NLP-extracted pain labels, and in the second experiment, we both trained and tested our pipeline using expert-extracted pain labels. Consequently, after being trained with one set of labels (NLP- or expert-extracted), our pipeline performed well on the test set that was labeled using the same method (NLP or expert). We also demonstrated that our pipeline’s performance is comparable to that of Wakabayashi et al [<xref ref-type="bibr" rid="ref13">13</xref>], who achieved their results using patient-reported pain labels.</p>
      <p>Our pipeline performed significantly better on the EN6 ROIs than on the EN3 ROIs. This could be the case because in comparison to EN3, our EN6 ROIs include additional ROIs with sizes of 20, 30, and 50 mm. From visual inspection, we suspect that, in addition to the characteristics of the BM lesion itself, its location (eg, its proximity to the spinal cord) may be a significant contributor to the BM pain. As a result, larger ROIs enable our algorithm to extract characteristics from outside the BM lesion. Wakabayashi et al [<xref ref-type="bibr" rid="ref13">13</xref>] also demonstrated the effectiveness of using ROIs outside of the BM lesion.</p>
      <p>We are unable to offer a convincing explanation as to why neural networks outperformed random forest and support vector machine classifiers in our analysis. Notwithstanding, it has been demonstrated that neural network classifiers perform better when applied to more difficult problems and larger data sets, while random forest and support vector machine classifiers typically perform well with smaller data sets [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>].</p>
      <p>Our pipeline was successful in extracting radiomics biomarkers capable of distinguishing between painful and painless BM lesions. These biomarkers potentially provide the opportunity to objectively identify clinical pain-related indicators that may aid in the diagnosis, treatment, and understanding of BM pain.</p>
      <p>Our work has several limitations. First, we used data from a single center for this retrospective study. A multicenter study with a larger data set is necessary to assess the generalizability of our radiomics pipeline for pain quantification. We anticipate that the performance of our NLP-radiomics pipeline will vary based on the pain scoring systems of the cohorts tested. Second, by using lesion center point–based geometrical ROIs, we ignored lesion characteristics such as size and shape, which may be important in the context of pain. Although we used Hounsfield units intensity thresholding to preserve some tumor information, we are considering implementing deep learning–based ROI segmentation in the future as it may better account for full tumor and surrounding tissue characteristics. Lastly, we used SMOTE resampling to address the issue of class imbalance. An alternative solution might be to develop cost-sensitive machine learning classifiers that account for the cost of misclassifying minority samples [<xref ref-type="bibr" rid="ref52">52</xref>]. However, there is no clear consensus in the literature on whether cost-sensitive learning outperforms resampling [<xref ref-type="bibr" rid="ref53">53</xref>]. A model that can differentiate between painful and painless lesions from medical imaging is a critical component of any possible radiomics-based pain quantification pipeline. This work not only shows the feasibility of developing a pain quantification tool, but also it removes some of the barriers to its development. As a result, our future work will be to apply our pipeline to patients’ past and current CT images and consultation notes in order to develop a longitudinal model of pain. Such a model should take into account not only images (taken before, during, and after delivering radiotherapy) but also other internal and external parameters that can influence how pain evolves over time (such as primary cancer type, radiation dose, other treatments, and pain medications). Also, it will include patient-reported pain scores to provide more accurate ground-truth pain labels in order to develop a more robust deep learning–based NLP pipeline [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref54">54</xref>]. This, however, is beyond the scope of this investigation.</p>
      <p>In conclusion, we demonstrated that our NLP and radiomics-based machine learning pipeline can effectively differentiate between painful and painless BM lesions in simulation CT images using ensemble lesion center point–based geometrical ROIs. Using NLP-extracted pain labels in conjunction with lesion center point–based radiomics features is time efficient. This helps to pave the way for the development of quickly trained and efficient clinical AI-based decision-making tools that can objectively measure cancer pain. Such a tool may help alleviate the burden of pain management and improve the quality of life of patients with BMs.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Sample data.</p>
        <media xlink:href="ai_v2i1e44779_app1.docx" xlink:title="DOCX File , 103 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">API</term>
          <def>
            <p>average pain intensity</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AUC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">BM</term>
          <def>
            <p>bone metastasis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">CT</term>
          <def>
            <p>computed tomography</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">EN</term>
          <def>
            <p>ensemble</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">ROC</term>
          <def>
            <p>receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">ROI</term>
          <def>
            <p>region of interest</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">SMOTE</term>
          <def>
            <p>Synthetic Minority Oversampling Technique</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">SP</term>
          <def>
            <p>spherical</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">VDP</term>
          <def>
            <p>verbally declared pain</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research was supported by the startup grant of J Kildea at the Research Institute of the McGill University Health Centre (RI-MUHC), the Ruth and Alex Dworkin scholarship award from the Faculty of Medicine and Health Sciences at McGill University, an RI-MUHC studentship award, a Grad Excellence Award-00293 from the Department of Physics at McGill University, Fonds de recherche du Québec - Santé (FRQS), and by the CREATE Responsible Health and Healthcare Data Science (SDRDS) grant of the Natural Sciences and Engineering Research Council. The authors would like to thank Dr Luc Galarneau for his help with statistical analysis.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van den Beuken-van Everdingen</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Hochstenbach</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Joosten</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Tjan-Heijnen</surname>
              <given-names>VC</given-names>
            </name>
            <name name-style="western">
              <surname>Janssen</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>Update on prevalence of pain in patients with cancer: systematic review and meta-analysis</article-title>
          <source>J Pain Symptom Manage</source>
          <year>2016</year>
          <month>06</month>
          <volume>51</volume>
          <issue>6</issue>
          <fpage>1070</fpage>
          <lpage>1090.e9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0885-3924(16)30048-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jpainsymman.2015.12.340</pub-id>
          <pub-id pub-id-type="medline">27112310</pub-id>
          <pub-id pub-id-type="pii">S0885-3924(16)30048-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McQuay</surname>
              <given-names>Henry J</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>Sally L</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>Dawn</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>R Andrew</given-names>
            </name>
            <name name-style="western">
              <surname>Derry</surname>
              <given-names>Sheena</given-names>
            </name>
          </person-group>
          <article-title>WITHDRAWN: radiotherapy for the palliation of painful bone metastases</article-title>
          <source>Cochrane Database Syst Rev</source>
          <year>2013</year>
          <month>11</month>
          <day>22</day>
          <volume>2013</volume>
          <issue>11</issue>
          <fpage>CD001793</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24271498"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/14651858.CD001793.pub2</pub-id>
          <pub-id pub-id-type="medline">24271498</pub-id>
          <pub-id pub-id-type="pmcid">PMC6564087</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grossman</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Undertreatment of cancer pain: barriers and remedies</article-title>
          <source>Support Care Cancer</source>
          <year>1993</year>
          <month>3</month>
          <volume>1</volume>
          <issue>2</issue>
          <fpage>74</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1007/bf00366899</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cleeland</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Janjan</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>CB</given-names>
            </name>
            <name name-style="western">
              <surname>Seiferheld</surname>
              <given-names>WF</given-names>
            </name>
            <name name-style="western">
              <surname>Curran</surname>
              <given-names>WJ</given-names>
            </name>
          </person-group>
          <article-title>Cancer pain management by radiotherapists: a survey of radiation therapy oncology group physicians</article-title>
          <source>Int J Radiat Oncol Biol Phys</source>
          <year>2000</year>
          <month>04</month>
          <day>01</day>
          <volume>47</volume>
          <issue>1</issue>
          <fpage>203</fpage>
          <lpage>208</lpage>
          <pub-id pub-id-type="doi">10.1016/s0360-3016(99)00276-x</pub-id>
          <pub-id pub-id-type="medline">10758325</pub-id>
          <pub-id pub-id-type="pii">S0360-3016(99)00276-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tracey</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Woolf</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Andrews</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Composite pain biomarker signatures for objective assessment and effective treatment</article-title>
          <source>Neuron</source>
          <year>2019</year>
          <month>03</month>
          <day>06</day>
          <volume>101</volume>
          <issue>5</issue>
          <fpage>783</fpage>
          <lpage>800</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0896-6273(19)30154-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.neuron.2019.02.019</pub-id>
          <pub-id pub-id-type="medline">30844399</pub-id>
          <pub-id pub-id-type="pii">S0896-6273(19)30154-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6800055</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Objective pain assessment: a key for the management of chronic pain</article-title>
          <source>F1000Res</source>
          <year>2020</year>
          <month>1</month>
          <day>23</day>
          <volume>9</volume>
          <fpage>35</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32047606"/>
          </comment>
          <pub-id pub-id-type="doi">10.12688/f1000research.20441.1</pub-id>
          <pub-id pub-id-type="medline">32047606</pub-id>
          <pub-id pub-id-type="pii">F1000 Faculty Rev-35</pub-id>
          <pub-id pub-id-type="pmcid">PMC6979466</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Niculescu</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Le-Niculescu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Levey</surname>
              <given-names>DF</given-names>
            </name>
            <name name-style="western">
              <surname>Roseberry</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Soe</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Judd</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McCormick</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Wessel</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kurian</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>FA</given-names>
            </name>
          </person-group>
          <article-title>Towards precision medicine for pain: diagnostic biomarkers and repurposed drugs</article-title>
          <source>Mol Psychiatry</source>
          <year>2019</year>
          <month>04</month>
          <volume>24</volume>
          <issue>4</issue>
          <fpage>501</fpage>
          <lpage>522</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30755720"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41380-018-0345-5</pub-id>
          <pub-id pub-id-type="medline">30755720</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41380-018-0345-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC6477790</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Diaz</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Caylor</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Strigo</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lerman</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lopez</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Ellis</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Simmons</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Keltner</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>Toward composite pain biomarkers of neuropathic pain-focus on peripheral neuropathic pain</article-title>
          <source>Front Pain Res (Lausanne)</source>
          <year>2022</year>
          <month>5</month>
          <day>11</day>
          <volume>3</volume>
          <fpage>869215</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35634449"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpain.2022.869215</pub-id>
          <pub-id pub-id-type="medline">35634449</pub-id>
          <pub-id pub-id-type="pmcid">PMC9130475</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Furfari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wan</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bezjak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>CF</given-names>
            </name>
            <name name-style="western">
              <surname>DeAngelis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Azad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chow</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Charames</surname>
              <given-names>GS</given-names>
            </name>
          </person-group>
          <article-title>Genetic biomarkers associated with pain flare and dexamethasone response following palliative radiotherapy in patients with painful bone metastases</article-title>
          <source>Ann Palliat Med</source>
          <year>2017</year>
          <month>12</month>
          <volume>6</volume>
          <issue>Suppl 2</issue>
          <fpage>S240</fpage>
          <lpage>S247</lpage>
          <pub-id pub-id-type="doi">10.21037/apm.2017.09.04</pub-id>
          <pub-id pub-id-type="medline">29156912</pub-id>
          <pub-id pub-id-type="pii">apm.2017.09.04</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gunn</surname>
              <given-names>Joshua</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>Melissa M</given-names>
            </name>
            <name name-style="western">
              <surname>Cotten</surname>
              <given-names>Bradley M</given-names>
            </name>
            <name name-style="western">
              <surname>Deer</surname>
              <given-names>Timothy R</given-names>
            </name>
          </person-group>
          <article-title>An analysis of biomarkers in patients with chronic pain</article-title>
          <source>Pain Physician</source>
          <year>2020</year>
          <month>01</month>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>E41</fpage>
          <lpage>E49</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.painphysicianjournal.com/linkout?issn=&#38;vol=23&#38;page=E41"/>
          </comment>
          <pub-id pub-id-type="medline">32013287</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marchi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vellucci</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mameli</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rita Piredda</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Finco</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Pain biomarkers</article-title>
          <source>Clinical Drug Investigation</source>
          <year>2009</year>
          <volume>29</volume>
          <issue>Supplement 1</issue>
          <fpage>41</fpage>
          <lpage>46</lpage>
          <pub-id pub-id-type="doi">10.2165/0044011-200929001-00006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ota</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Connolly</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivasan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Capizzano</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Moritani</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Mechanisms and origins of spinal pain: from molecules to anatomy, with diagnostic clues and imaging findings</article-title>
          <source>Radiographics</source>
          <year>2020</year>
          <month>07</month>
          <volume>40</volume>
          <issue>4</issue>
          <fpage>1163</fpage>
          <lpage>1181</lpage>
          <pub-id pub-id-type="doi">10.1148/rg.2020190185</pub-id>
          <pub-id pub-id-type="medline">32501739</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wakabayashi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Koide</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Aoyama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Shimizu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Miyauchi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tanaka</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tachibana</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Nakamura</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kodaira</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>A predictive model for pain response following radiotherapy for treatment of spinal metastases</article-title>
          <source>Sci Rep</source>
          <year>2021</year>
          <month>06</month>
          <day>18</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>12908</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-021-92363-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-021-92363-0</pub-id>
          <pub-id pub-id-type="medline">34145367</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-021-92363-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC8213735</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carlson</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Hooten</surname>
              <given-names>WM</given-names>
            </name>
          </person-group>
          <article-title>Pain-linguistics and natural language processing</article-title>
          <source>Mayo Clin Proc Innov Qual Outcomes</source>
          <year>2020</year>
          <month>06</month>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>346</fpage>
          <lpage>347</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2542-4548(20)30032-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.mayocpiqo.2020.01.005</pub-id>
          <pub-id pub-id-type="medline">32542226</pub-id>
          <pub-id pub-id-type="pii">S2542-4548(20)30032-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7283550</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dave</surname>
              <given-names>Amisha D</given-names>
            </name>
            <name name-style="western">
              <surname>Ruano</surname>
              <given-names>Gualberto</given-names>
            </name>
            <name name-style="western">
              <surname>Kost</surname>
              <given-names>Jonathan</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Xiaoyan</given-names>
            </name>
          </person-group>
          <article-title>Automated extraction of pain symptoms: a natural language approach using electronic health records</article-title>
          <source>Pain Physician</source>
          <year>2022</year>
          <month>03</month>
          <volume>25</volume>
          <issue>2</issue>
          <fpage>E245</fpage>
          <lpage>E254</lpage>
          <pub-id pub-id-type="medline">35322976</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tighe</surname>
              <given-names>Patrick J</given-names>
            </name>
            <name name-style="western">
              <surname>Sannapaneni</surname>
              <given-names>Bharadwaj</given-names>
            </name>
            <name name-style="western">
              <surname>Fillingim</surname>
              <given-names>Roger B</given-names>
            </name>
            <name name-style="western">
              <surname>Doyle</surname>
              <given-names>Charlie</given-names>
            </name>
            <name name-style="western">
              <surname>Kent</surname>
              <given-names>Michael</given-names>
            </name>
            <name name-style="western">
              <surname>Shickel</surname>
              <given-names>Ben</given-names>
            </name>
            <name name-style="western">
              <surname>Rashidi</surname>
              <given-names>Parisa</given-names>
            </name>
          </person-group>
          <article-title>Forty-two million ways to describe pain: topic modeling of 200,000 PubMed pain-related abstracts using natural language processing and deep learning-based text generation</article-title>
          <source>Pain Med</source>
          <year>2020</year>
          <month>11</month>
          <day>01</day>
          <volume>21</volume>
          <issue>11</issue>
          <fpage>3133</fpage>
          <lpage>3160</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32249306"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/pm/pnaa061</pub-id>
          <pub-id pub-id-type="medline">32249306</pub-id>
          <pub-id pub-id-type="pii">5816322</pub-id>
          <pub-id pub-id-type="pmcid">PMC7685694</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Matsangidou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liampas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pittara</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pattichi</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Zis</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Machine learning in pain medicine: an up-to-date systematic review</article-title>
          <source>Pain Ther</source>
          <year>2021</year>
          <month>12</month>
          <day>26</day>
          <volume>10</volume>
          <issue>2</issue>
          <fpage>1067</fpage>
          <lpage>1084</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34568998"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40122-021-00324-2</pub-id>
          <pub-id pub-id-type="medline">34568998</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40122-021-00324-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC8586126</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Neijenhuijs</surname>
              <given-names>KI</given-names>
            </name>
            <name name-style="western">
              <surname>Peeters</surname>
              <given-names>CFW</given-names>
            </name>
            <name name-style="western">
              <surname>van Weert</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Cuijpers</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Leeuw</surname>
              <given-names>IV</given-names>
            </name>
          </person-group>
          <article-title>Symptom clusters among cancer survivors: what can machine learning techniques tell us?</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2021</year>
          <month>08</month>
          <day>16</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>166</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-021-01352-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-021-01352-4</pub-id>
          <pub-id pub-id-type="medline">34399698</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-021-01352-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC8369803</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nam</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Pak</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Development and validation of a radiomics model for differentiating bone islands and osteoblastic bone metastases at abdominal CT</article-title>
          <source>Radiology</source>
          <year>2021</year>
          <month>06</month>
          <volume>299</volume>
          <issue>3</issue>
          <fpage>626</fpage>
          <lpage>632</lpage>
          <pub-id pub-id-type="doi">10.1148/radiol.2021203783</pub-id>
          <pub-id pub-id-type="medline">33787335</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>A CT-based radiomics nomogram for distinguishing between benign and malignant bone tumours</article-title>
          <source>Cancer Imaging</source>
          <year>2021</year>
          <month>02</month>
          <day>06</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>20</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cancerimagingjournal.biomedcentral.com/articles/10.1186/s40644-021-00387-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s40644-021-00387-6</pub-id>
          <pub-id pub-id-type="medline">33549151</pub-id>
          <pub-id pub-id-type="pii">10.1186/s40644-021-00387-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7866630</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Naseri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Skamene</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tolba</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Faye</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Ramia</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Khriguian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Patrick</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Andrade Hernandez</surname>
              <given-names>AX</given-names>
            </name>
            <name name-style="western">
              <surname>David</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kildea</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Radiomics-based machine learning models to distinguish between metastatic and healthy bone using lesion-center-based geometric regions of interest</article-title>
          <source>Sci Rep</source>
          <year>2022</year>
          <month>06</month>
          <day>14</day>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>9866</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-022-13379-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-022-13379-8</pub-id>
          <pub-id pub-id-type="medline">35701461</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-022-13379-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC9198102</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mashayekhi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Parekh</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Faghih</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>VK</given-names>
            </name>
            <name name-style="western">
              <surname>Jacobs</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Zaheer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Radiomic features of the pancreas on CT imaging accurately differentiate functional abdominal pain, recurrent acute pancreatitis, and chronic pancreatitis</article-title>
          <source>Eur J Radiol</source>
          <year>2020</year>
          <month>02</month>
          <volume>123</volume>
          <fpage>108778</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31846864"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ejrad.2019.108778</pub-id>
          <pub-id pub-id-type="medline">31846864</pub-id>
          <pub-id pub-id-type="pii">S0720-048X(19)30428-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7968044</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vedantam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hassan</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kotrotsou</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hassan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zinn</surname>
              <given-names>PO</given-names>
            </name>
            <name name-style="western">
              <surname>Viswanathan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Colen</surname>
              <given-names>RR</given-names>
            </name>
          </person-group>
          <article-title>Magnetic resonance-based radiomic analysis of radiofrequency lesion predicts outcomes after percutaneous cordotomy: a feasibility study</article-title>
          <source>Oper Neurosurg (Hagerstown)</source>
          <year>2020</year>
          <month>06</month>
          <day>01</day>
          <volume>18</volume>
          <issue>6</issue>
          <fpage>721</fpage>
          <lpage>727</lpage>
          <pub-id pub-id-type="doi">10.1093/ons/opz288</pub-id>
          <pub-id pub-id-type="medline">31665446</pub-id>
          <pub-id pub-id-type="pii">5607417</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online October 11, 2018</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1810.04805</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Naseri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kafi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Skamene</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tolba</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Faye</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Ramia</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Khriguian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kildea</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Development of a generalizable natural language processing pipeline to extract physician-reported pain from clinical reports: Generated using publicly-available datasets and tested on institutional clinical reports for cancer patients with bone metastases</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>08</month>
          <volume>120</volume>
          <fpage>103864</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00193-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103864</pub-id>
          <pub-id pub-id-type="medline">34265451</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00193-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elbattah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Arnaud</surname>
              <given-names>É</given-names>
            </name>
            <name name-style="western">
              <surname>Gignon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dequen</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>The role of text analytics in healthcare: a review of recent developments and applications</article-title>
          <year>2021</year>
          <conf-name>14th International Joint Conference on Biomedical Engineering Systems and Technologies - Scale-IT-up</conf-name>
          <conf-date>February 11-13, 2021</conf-date>
          <conf-loc>Online</conf-loc>
          <pub-id pub-id-type="doi">10.5220/0010414508250832</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>TMF</given-names>
            </name>
            <name name-style="western">
              <surname>Cochran</surname>
              <given-names>WG</given-names>
            </name>
          </person-group>
          <article-title>Sampling techniques, second edition</article-title>
          <source>Applied Statistics</source>
          <year>1964</year>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>54</fpage>
          <pub-id pub-id-type="doi">10.2307/2985224</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Freedman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pisani</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Purves</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>Statistics: Fourth International Student Edition</source>
          <year>2007</year>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>W.W. Norton &#38; Company</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aronson</surname>
              <given-names>A R</given-names>
            </name>
          </person-group>
          <article-title>Effective mapping of biomedical text to the UMLS Metathesaurus: the MetaMap program</article-title>
          <source>Proc AMIA Symp</source>
          <year>2001</year>
          <fpage>17</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/11825149"/>
          </comment>
          <pub-id pub-id-type="medline">11825149</pub-id>
          <pub-id pub-id-type="pii">D010001275</pub-id>
          <pub-id pub-id-type="pmcid">PMC2243666</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McCray</surname>
              <given-names>A T</given-names>
            </name>
            <name name-style="western">
              <surname>Aronson</surname>
              <given-names>A R</given-names>
            </name>
            <name name-style="western">
              <surname>Browne</surname>
              <given-names>A C</given-names>
            </name>
            <name name-style="western">
              <surname>Rindflesch</surname>
              <given-names>T C</given-names>
            </name>
            <name name-style="western">
              <surname>Razi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivasan</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>UMLS knowledge for biomedical language processing</article-title>
          <source>Bull Med Libr Assoc</source>
          <year>1993</year>
          <month>04</month>
          <volume>81</volume>
          <issue>2</issue>
          <fpage>184</fpage>
          <lpage>194</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/8472004"/>
          </comment>
          <pub-id pub-id-type="medline">8472004</pub-id>
          <pub-id pub-id-type="pmcid">PMC225761</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
          <article-title>hn617/texTRACTOR: texTRACTOR</article-title>
          <source>Zenodo</source>
          <year>2021</year>
          <access-date>2023-04-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://zenodo.org/record/4649625">https://zenodo.org/record/4649625</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <article-title>hn617/diCOMBINE: diCOMBINE</article-title>
          <source>Zenodo</source>
          <year>2021</year>
          <access-date>2023-04-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://zenodo.org/record/5218743">https://zenodo.org/record/5218743</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Busscher</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ploegmakers</surname>
              <given-names>JJW</given-names>
            </name>
            <name name-style="western">
              <surname>Verkerke</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Veldhuizen</surname>
              <given-names>AG</given-names>
            </name>
          </person-group>
          <article-title>Comparative anatomical dimensions of the complete human and porcine spine</article-title>
          <source>Eur Spine J</source>
          <year>2010</year>
          <month>07</month>
          <day>26</day>
          <volume>19</volume>
          <issue>7</issue>
          <fpage>1104</fpage>
          <lpage>1114</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20186441"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00586-010-1326-9</pub-id>
          <pub-id pub-id-type="medline">20186441</pub-id>
          <pub-id pub-id-type="pmcid">PMC2900026</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deglint</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rangayyan</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Ayres</surname>
              <given-names>FJ</given-names>
            </name>
            <name name-style="western">
              <surname>Boag</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Zuffo</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Three-dimensional segmentation of the tumor in computed tomographic images of neuroblastoma</article-title>
          <source>J Digit Imaging</source>
          <year>2006</year>
          <month>8</month>
          <day>25</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>72</fpage>
          <lpage>87</lpage>
          <pub-id pub-id-type="doi">10.1007/10278-006-0769-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ulano</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bredella</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chebib</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Simeone</surname>
              <given-names>FJ</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Torriani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>CY</given-names>
            </name>
          </person-group>
          <article-title>Distinguishing untreated osteoblastic metastases from enostoses using CT attenuation measurements</article-title>
          <source>Am J Roentgenol</source>
          <year>2016</year>
          <month>08</month>
          <volume>207</volume>
          <issue>2</issue>
          <fpage>362</fpage>
          <lpage>368</lpage>
          <pub-id pub-id-type="doi">10.2214/ajr.15.15559</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <article-title>Smoothing Images</article-title>
          <source>OpenCV</source>
          <access-date>2023-09-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://docs.opencv.org/4.x/d4/d13/tutorial_py_filtering.html">https://docs.opencv.org/4.x/d4/d13/tutorial_py_filtering.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <article-title>mhe/pynrrd: v0.4.3 Released</article-title>
          <source>Zenodo</source>
          <year>2022</year>
          <access-date>2023-04-18</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://zenodo.org/record/6501810">https://zenodo.org/record/6501810</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="web">
          <source>Nearly Raw Raster Data</source>
          <access-date>2022-09-04</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://teem.sourceforge.net/nrrd/index.html">http://teem.sourceforge.net/nrrd/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lemaître</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Nogueira</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Aridas</surname>
              <given-names>CK</given-names>
            </name>
          </person-group>
          <article-title>Imbalanced-learn: A Python Toolbox to Tackle the Curse of Imbalanced Datasets in Machine Learning</article-title>
          <source>J Mach Learn Res</source>
          <year>2017</year>
          <volume>18</volume>
          <fpage>1</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jmlr.org/papers/volume18/16-365/16-365.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Low</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Review of Understanding Basic Statistics</article-title>
          <source>Am Stat</source>
          <year>1998</year>
          <volume>52</volume>
          <issue>2</issue>
          <fpage>198</fpage>
          <pub-id pub-id-type="doi">10.2307/2685480</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Torvik</surname>
              <given-names>Karin</given-names>
            </name>
            <name name-style="western">
              <surname>Hølen</surname>
              <given-names>Jacob</given-names>
            </name>
            <name name-style="western">
              <surname>Kaasa</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kirkevold</surname>
              <given-names>?</given-names>
            </name>
            <name name-style="western">
              <surname>Holtan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kongsgaard</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Rustøen</surname>
              <given-names>Tone</given-names>
            </name>
          </person-group>
          <article-title>Pain in elderly hospitalized cancer patients with bone metastases in Norway</article-title>
          <source>Int J Palliat Nurs</source>
          <year>2008</year>
          <month>05</month>
          <volume>14</volume>
          <issue>5</issue>
          <fpage>238</fpage>
          <lpage>245</lpage>
          <pub-id pub-id-type="doi">10.12968/ijpn.2008.14.5.29491</pub-id>
          <pub-id pub-id-type="medline">18563017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chawla</surname>
              <given-names>NV</given-names>
            </name>
            <name name-style="western">
              <surname>Bowyer</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Kegelmeyer</surname>
              <given-names>WP</given-names>
            </name>
          </person-group>
          <article-title>SMOTE: synthetic minority over-sampling technique</article-title>
          <source>J Artif Intell Res</source>
          <year>2002</year>
          <month>06</month>
          <day>01</day>
          <volume>16</volume>
          <fpage>321</fpage>
          <lpage>357</lpage>
          <pub-id pub-id-type="doi">10.1613/jair.953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>HH</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>EY</given-names>
            </name>
            <name name-style="western">
              <surname>Vardhanabhuti</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Effect of machine learning re-sampling techniques for imbalanced datasets in F-FDG PET-based radiomics model on prognostication performance in cohorts of head and neck cancer patients</article-title>
          <source>Eur J Nucl Med Mol Imaging</source>
          <year>2020</year>
          <month>11</month>
          <day>06</day>
          <volume>47</volume>
          <issue>12</issue>
          <fpage>2826</fpage>
          <lpage>2835</lpage>
          <pub-id pub-id-type="doi">10.1007/s00259-020-04756-4</pub-id>
          <pub-id pub-id-type="medline">32253486</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00259-020-04756-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tibshirani</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Regression shrinkage and selection via The Lasso: a retrospective</article-title>
          <source>J R Stat Soc Series B Stat Methodol</source>
          <year>2011</year>
          <volume>73</volume>
          <issue>3</issue>
          <fpage>273</fpage>
          <lpage>282</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1467-9868.2011.00771.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Machine and deep learning based radiomics models for preoperative prediction of benign and malignant sacral tumors</article-title>
          <source>Front Oncol</source>
          <year>2020</year>
          <month>10</month>
          <day>16</day>
          <volume>10</volume>
          <fpage>564725</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33178593"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fonc.2020.564725</pub-id>
          <pub-id pub-id-type="medline">33178593</pub-id>
          <pub-id pub-id-type="pmcid">PMC7596901</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shur</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Doran</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ap Dafydd</surname>
              <given-names>Derfel</given-names>
            </name>
            <name name-style="western">
              <surname>Downey</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>James P B</given-names>
            </name>
            <name name-style="western">
              <surname>Papanikolaou</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Messiou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Koh</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Orton</surname>
              <given-names>MR</given-names>
            </name>
          </person-group>
          <article-title>Radiomics in oncology: a practical guide</article-title>
          <source>Radiographics</source>
          <year>2021</year>
          <month>10</month>
          <volume>41</volume>
          <issue>6</issue>
          <fpage>1717</fpage>
          <lpage>1732</lpage>
          <pub-id pub-id-type="doi">10.1148/rg.2021210037</pub-id>
          <pub-id pub-id-type="medline">34597235</pub-id>
          <pub-id pub-id-type="pmcid">PMC8501897</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fawcett</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>An introduction to ROC analysis</article-title>
          <source>Pattern Recognit Lett</source>
          <year>2006</year>
          <month>6</month>
          <volume>27</volume>
          <issue>8</issue>
          <fpage>861</fpage>
          <lpage>874</lpage>
          <pub-id pub-id-type="doi">10.1016/j.patrec.2005.10.010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fleischman</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Frazer</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Daya</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jui</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Newgard</surname>
              <given-names>CD</given-names>
            </name>
          </person-group>
          <article-title>Effectiveness and safety of fentanyl compared with morphine for out-of-hospital analgesia</article-title>
          <source>Prehosp Emerg Care</source>
          <year>2010</year>
          <month>03</month>
          <day>03</day>
          <volume>14</volume>
          <issue>2</issue>
          <fpage>167</fpage>
          <lpage>175</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20199230"/>
          </comment>
          <pub-id pub-id-type="doi">10.3109/10903120903572301</pub-id>
          <pub-id pub-id-type="medline">20199230</pub-id>
          <pub-id pub-id-type="pmcid">PMC2924527</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fernández</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>García</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Galar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Prati</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Krawczyk</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Herrera</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Learning from imbalanced data streams</article-title>
          <source>Learning from Imbalanced Data Sets</source>
          <year>2018</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Spirnger</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Deep learning vs. radiomics for predicting axillary lymph node metastasis of breast cancer using ultrasound images: don't forget the peritumoral region</article-title>
          <source>Front Oncol</source>
          <year>2020</year>
          <month>1</month>
          <day>31</day>
          <volume>10</volume>
          <fpage>53</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32083007"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fonc.2020.00053</pub-id>
          <pub-id pub-id-type="medline">32083007</pub-id>
          <pub-id pub-id-type="pmcid">PMC7006026</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lisson</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Lisson</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Mezger</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Thaiss</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Tausch</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Beer</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Stilgenbauer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Beer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goetz</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Deep neural networks and machine learning radiomics modelling for prediction of relapse in mantle cell lymphoma</article-title>
          <source>Cancers (Basel)</source>
          <year>2022</year>
          <month>04</month>
          <day>15</day>
          <volume>14</volume>
          <issue>8</issue>
          <fpage>2008</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=cancers14082008"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/cancers14082008</pub-id>
          <pub-id pub-id-type="medline">35454914</pub-id>
          <pub-id pub-id-type="pii">cancers14082008</pub-id>
          <pub-id pub-id-type="pmcid">PMC9028737</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thai-Nghe</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gantner</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt-Thieme</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Cost-sensitive learning methods for imbalanced data</article-title>
          <year>2010</year>
          <conf-name>The 2010 International Joint Conference on Neural Networks (IJCNN)</conf-name>
          <conf-date>July 18-23, 2010</conf-date>
          <conf-loc>Barcelona</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ijcnn.2010.5596486</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>La Cour</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ghosh</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Stahlbock</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Crone</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lessmann</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Effects of Oversampling Versus Cost-Sensitive Learning for Bayesian and SVM Classifiers</article-title>
          <source>Data Mining. Annals of Information Systems (volume 8)</source>
          <year>2010</year>
          <publisher-loc>Boston, MA</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tamang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Humbert-Droz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gianfrancesco</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Izadi</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Schmajuk</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yazdany</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Practical considerations for developing clinical natural language processing systems for population health management and measurement</article-title>
          <source>JMIR Med Inform</source>
          <year>2023</year>
          <month>01</month>
          <day>03</day>
          <volume>11</volume>
          <fpage>e37805</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2023//e37805/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/37805</pub-id>
          <pub-id pub-id-type="medline">36595345</pub-id>
          <pub-id pub-id-type="pii">v11i1e37805</pub-id>
          <pub-id pub-id-type="pmcid">PMC9846439</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
