<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR AI</journal-id><journal-id journal-id-type="publisher-id">ai</journal-id><journal-id journal-id-type="index">41</journal-id><journal-title>JMIR AI</journal-title><abbrev-journal-title>JMIR AI</abbrev-journal-title><issn pub-type="epub">2817-1705</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v4i1e74053</article-id><article-id pub-id-type="doi">10.2196/74053</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Assessing Revisit Risk in Emergency Department Patients: Machine Learning Approach</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Juang</surname><given-names>Wang-Chuan</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Cai</surname><given-names>Zheng-Xun</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chen</surname><given-names>Chia-Mei</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>You</surname><given-names>Zhi-Hong</given-names></name><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Quality Management Center, Kaohsiung Veterans General Hospital</institution><addr-line>No.386, Dazhong 1st Rd., Zuoying Dist.</addr-line><addr-line>Kaohsiung</addr-line><country>Taiwan</country></aff><aff id="aff2"><institution>Department of Business Management, College of Management, National Sun Yat-sen University</institution><addr-line>Kaohsiung</addr-line><country>Taiwan</country></aff><aff id="aff3"><institution>Department of Health-Business Administration, Fooyin University</institution><addr-line>Kaohsiung</addr-line><country>Taiwan</country></aff><aff id="aff4"><institution>Department of Information Management, College of Management, National Sun Yat-sen University</institution><addr-line>Kaohsiung</addr-line><country>Taiwan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Luo</surname><given-names>Gang</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Do&#x011F;aner</surname><given-names>Adem</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Bai</surname><given-names>Enze</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Wang-Chuan Juang, MD, Quality Management Center, Kaohsiung Veterans General Hospital, No.386, Dazhong 1st Rd., Zuoying Dist., Kaohsiung, 813414, Taiwan, 886 7-342-2121 ext 4191; <email>wcchuang@vghks.gov.tw</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>7</day><month>8</month><year>2025</year></pub-date><volume>4</volume><elocation-id>e74053</elocation-id><history><date date-type="received"><day>17</day><month>03</month><year>2025</year></date><date date-type="rev-recd"><day>30</day><month>05</month><year>2025</year></date><date date-type="accepted"><day>30</day><month>05</month><year>2025</year></date></history><copyright-statement>&#x00A9; Wang-Chuan Juang, Zheng-Xun Cai, Chia-Mei Chen, Zhi-Hong You. Originally published in JMIR AI (<ext-link ext-link-type="uri" xlink:href="https://ai.jmir.org">https://ai.jmir.org</ext-link>), 7.8.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.ai.jmir.org/">https://www.ai.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://ai.jmir.org/2025/1/e74053"/><abstract><sec><title>Background</title><p>Overcrowded emergency rooms might degrade the quality of care and overload the clinic staff. Assessing unscheduled return visits (URVs) to the emergency department (ED) is a quality assurance procedure to identify ED-discharged patients with a high likelihood of bounce-back, to ensure patient safety, and ultimately to reduce medical costs by decreasing the frequency of URVs. The field of machine learning (ML) has evolved considerably in the past decades, and many ML applications have been deployed in various contexts.</p></sec><sec><title>Objective</title><p>This study aims to develop an ML-assisted framework that identifies high-risk patients who may revisit the ED within 72 hours after the initial visit. Furthermore, this study evaluates different ML models, feature sets, and feature encoding methods in order to build an effective prediction model.</p></sec><sec sec-type="methods"><title>Methods</title><p>This study proposes an ML-assisted system that extracts the features from both structured and unstructured medical data to predict patients who are likely to revisit the ED, where the structured data includes patients&#x2019; electronic health records, and the unstructured data is their medical notes (subjective, objective, assessment, and plan). A 5-year dataset consisting of 184,687 ED visits, along with 324,111 historical electronic health records and the associated medical notes, was obtained from Kaohsiung Veterans General Hospital, a tertiary medical center in Taiwan, to evaluate the proposed system.</p></sec><sec sec-type="results"><title>Results</title><p>The evaluation results indicate that incorporating convolutional neural network&#x2013;based feature extraction from unstructured ED physician narrative notes, combined with structured vital signs and demographic data, significantly enhances predictive performance. The proposed approach achieves an area under the receiver operating characteristic curve of 0.705 and a recall of 0.718, demonstrating its effectiveness in predicting URVs. These findings highlight the potential of integrating structured and unstructured clinical data to improve predictive accuracy in this context.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The study demonstrates that an ML-assisted framework may be applied as a decision support tool to assist ED clinicians in identifying revisiting patients, although the model&#x2019;s performance may not be sufficient for clinic implementation. Given the improvement in the area under the receiver operating characteristic curve, the proposed framework should be further explored as a workable decision support tool to pinpoint ED patients with a high risk of revisit and provide them with appropriate and timely care.</p></sec></abstract><kwd-group><kwd>unscheduled return visit</kwd><kwd>machine learning</kwd><kwd>electronic health records</kwd><kwd>deep learning</kwd><kwd>clinical decision support system</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>Health care services are inherently risky, as they might involve unpredictable events. Risks may damage a health care provider&#x2019;s finances, patient safety, staff satisfaction, or liabilities. Risk management in health care is extremely important&#x2014;as human lives are on the line&#x2014;which consists of a complex set of clinical and administrative systems, processes, procedures, and reporting structures designed to monitor, identify, assess, mitigate, or prevent risks to patients.</p><p>The coordination between primary care providers and hospitals in Taiwan often lacks a streamlined and effective referral mechanism, contributing significantly to emergency department (ED) overcrowding. In Taiwan, patients often seek medical support from major medical institutions rather than local clinics. This tendency may be attributed to the structure of the national health care insurance system in Taiwan, where diagnostic fees are similar between local clinics and large medical institutions. In the current system, patients with nonemergency conditions frequently bypass local clinics and primary care providers, opting to visit the ED directly. Moreover, primary care providers may fail to appropriately direct patients to specialized departments or hospitals due to limited communication channels, inadequate follow-up procedures, or the absence of clear referral protocols. Without a robust referral system, conditions that could be managed effectively in primary care settings are unnecessarily escalated to emergency care, further straining ED resources.</p><p>Premature self-discharge, where patients choose to leave the ED before completing their prescribed treatment or before being officially discharged by medical professionals, is a significant contributing factor to ED overcrowding in Taiwan. This behavior often stems from patients&#x2019; subjective perception of their condition improving or from a lack of understanding of the importance of completing treatment. Cultural attitudes toward health and limited medical knowledge further exacerbate this issue, as patients may misinterpret temporary symptom relief as a full recovery. Such self-discharges frequently result in incomplete or interrupted care, which can lead to complications or the progression of the underlying medical condition. Consequently, these patients are likely to return to the ED when their symptoms reappear or deteriorate, thereby increasing the number of unscheduled return visits (URVs). This not only strains ED resources but also disrupts patient flow and increases the workload for health care providers. Additionally, premature self-discharge may be influenced by nonmedical factors, such as long waiting times, perceived inconvenience, or economic pressures, despite Taiwan&#x2019;s universal health care system. Patients who prioritize immediate symptom relief over long-term health outcomes may also undervalue the importance of follow-up care and professional medical advice.</p><p>Patients admitted to the ED often require timely health care resources. A growing number of ED patients in recent years demand more health care resources than ever [<xref ref-type="bibr" rid="ref1">1</xref>]; overcrowded emergency rooms are a common phenomenon worldwide. According to Taiwan&#x2019;s ED statistical data [<xref ref-type="bibr" rid="ref2">2</xref>], more than 6.1 million ED visits in 2022 contributed to a 13.6% increase compared with 2021. Among the ED admissions, patients with varying severity of diseases or comorbidities request even more health care services. Efficient use of ED services becomes a challenge for health care management, where the unexpected ED revisit rate is a common performance metric. The number of revisits could be reduced if a clinic support system assesses the revisit risk at a patient&#x2019;s initial visit to the ED.</p><p>Addressing the issue of ED overcrowding requires the implementation of long-term solutions aimed at optimizing health care resource allocation and improving patient flow management. While systemic changes, such as enhancing primary care accessibility and strengthening referral mechanisms, are critical, such reforms often require significant time and policy adjustments. To provide immediate and practical relief, this study focuses on the development of a clinical decision support system designed to predict the likelihood of patient unplanned revisits. By leveraging predictive analytics, the proposed clinical decision support system enables health care providers to identify high-risk patients and implement targeted interventions, such as personalized discharge planning and follow-up care. These measures not only improve patient outcomes but also help alleviate the burden on EDs, offering a scalable and effective tool to mitigate overcrowding while broader systemic solutions are pursued.</p><p>The applications of information technology to improve health care delivery have been appreciated for decades. To control risks and reduce clinical errors, health care organizations can learn from retrospective events. Health information technologies, such as electronic health records (EHRs), provide good access to retrospective patient information. With the expanding applications of machine learning (ML) on outcome prediction, these use cases have demonstrated the applicability of assessing patient risk from data repositories. Therefore, this study aims to develop an ML-assisted model that predicts URVs in the ED and anticipates that such an application could improve patient safety and reduce medical costs by decreasing the frequency of URVs.</p></sec><sec id="s1-2"><title>Related Work</title><p>It is critical for emergency clinicians to determine high-risk patients who might return in worse conditions or even die. A study [<xref ref-type="bibr" rid="ref3">3</xref>] on predictors of 30-day ED revisits and 90-day functional decline or mortality concluded that age, sex, polypharmacy, and cognitive impairment were independent predictors of a 30-day ED revisit and that no effective clinical prediction model could be developed. Another study [<xref ref-type="bibr" rid="ref4">4</xref>] analyzed multi-state ED revisit data. Within 3 days of an index ED visit, 8.2% of patients returned within 72 hours; 32% of those revisits occurred at a different health care institution. Revisit rates varied by diagnosis and by state. Research on ED revisits in different countries yielded varying findings. To differentiate patient risk groups, an analytic study [<xref ref-type="bibr" rid="ref5">5</xref>] collected 10-year EHR data from multiple health care institutes and applied group-based trajectory modeling. Patients with behavioral diagnoses, injuries, alcohol and substance abuse, stroke, or diabetes had a higher risk of revisiting.</p><p>Several studies [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>] analyzed ED revisit cases in Taiwan. The first study concluded the following findings: 5.47% of patients had a revisit within 72 hours; most revisits were related to illness; and abdominal pain was the most common presentation (55.7%). The second analysis, focusing on unplanned revisits with abdominal pain, demonstrated that older patients receiving multiple analgesics and laboratory tests had a high risk of URV. The third work summarized factors that may impact ED revisits, including blood pressure, pulse rate, fever, triage level, gender, and main illness, while old age was identified as a key factor. The fourth work investigated the risk factors of ED revisits among patients younger than 50 years and applied the decision tree (DT) to identify the variables capable of partitioning the groups into URVs and non-URVs. They found that the Charlson Comorbidity Index (CCI) scores for URVs are higher than those of non-URVs, and the triage levels of URVs are more severe than those of non-URVs.</p><p>A prior study [<xref ref-type="bibr" rid="ref9">9</xref>] analyzed 48-hour ED revisits in a hospital in Thailand. In addition to their revisits mostly being related to gastrointestinal illness (28.76%), they observed the key predictive factors similar to Taiwan&#x2019;s previous research. The past work encouraged further study to evaluate the most common and critical causes of revisits to improve revisit prediction. Most of the past research analyzed URV cases, excluding non-URV cases, and then applied statistical approaches to determine the common factors of URV patients. Even though most ED patients were non-URVs, they might exhibit some similar clinical characteristics to URV cases. Modern ML models might be able to learn the correlations among those features.</p><p>A review study [<xref ref-type="bibr" rid="ref10">10</xref>] explored the existing research that applied ML models to predict ED revisits. Logistic regression (LR) is the most widely used method, while extreme gradient boosting generally exhibits superior performance. Developing ML prediction models for ED URVs is feasible; however, improving the accuracy beyond 0.75 remains a challenge.</p><p>Vest and Ben-Assuli [<xref ref-type="bibr" rid="ref11">11</xref>] applied a DT algorithm to predict the risk of 30-day ED readmissions. Social determinants of health measurements have poor discriminating ability, but the prediction performance improves with more patient information, including current triage and historical data. McCusker et al [<xref ref-type="bibr" rid="ref12">12</xref>] designed a screening tool with 27 self-report screening questions to assess health risks in senior patients during the 6 months following their initial ED visits. Davazdahemami et al [<xref ref-type="bibr" rid="ref13">13</xref>] adopted a deep neural network model to predict URVs to the ED. They applied the word embedding model (Doc2Vec) to encode unstructured physician notes and concluded that leveraging structured and unstructured EHR data improves prediction performance.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Population and Setting</title><p>Kaohsiung Veterans General Hospital (KVGH) is one of Taiwan&#x2019;s largest general hospitals serving the southern region of Taiwan and offering inpatient, outpatient, and ED health care services. This study analyzed the retrospective administrative medical data of outpatients who sought ED services at KVGH between January 2018 and December 2022. The studied data contains 2 parts, structured and unstructured data, where structured data refers to EHR data and unstructured data consists of subjective, objective, assessment, and plan notes.</p><p><xref ref-type="fig" rid="figure1">Figure 1</xref> outlines the workflow when a patient submits a discharge request. In the initial stage, the system retrieves the patient&#x2019;s medical records and analyzes them in the subsequent stage. The model then assesses the likelihood of the patient revisiting the ED within 72 hours based on their medical data. The prediction outcomes serve as decision support for physicians in the clinical assessment process. If no significant risk factors for readmission are identified, the discharge request is approved. However, if the model predicts a high probability of an unplanned revisit, physicians may advise the patient to stay and provide an explanation of their medical condition. <xref ref-type="table" rid="table1">Tables 1</xref><xref ref-type="table" rid="table2"/>-<xref ref-type="table" rid="table3">3</xref> outline the demographics of the studied dataset.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>A patient discharge workflow. CDSS: clinical decision support system; EHR: electronic health record.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e74053_fig01.png"/></fig><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>The demographic of the numeric variables in the studied dataset.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Variables</td><td align="left" valign="top">Mean (SD)</td><td align="left" valign="top">Median (range)</td></tr></thead><tbody><tr><td align="left" valign="top">Age (years)</td><td align="char" char="." valign="top">53.90 (21.02)</td><td align="left" valign="top">55 (17-111)</td></tr><tr><td align="left" valign="top">HBP<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="char" char="." valign="top">134.14 (23.96)</td><td align="left" valign="top">133 (12-279)</td></tr><tr><td align="left" valign="top">LBP<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="char" char="." valign="top">80.55 (14.88)</td><td align="left" valign="top">80 (6-227)</td></tr><tr><td align="left" valign="top">MAP<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="char" char="." valign="top">98.50 (16.34)</td><td align="left" valign="top">97.67 (17-230)</td></tr><tr><td align="left" valign="top">Pulse</td><td align="char" char="." valign="top">79.91 (15.57)</td><td align="left" valign="top">78 (5-275)</td></tr><tr><td align="left" valign="top">Temperature</td><td align="char" char="." valign="top">36.60 (0.76)</td><td align="left" valign="top">36.50 (25-44)</td></tr><tr><td align="left" valign="top">Breath</td><td align="char" char="." valign="top">17.53 (2.36)</td><td align="left" valign="top">18 (1-79)</td></tr><tr><td align="left" valign="top">SPO<sub>2</sub></td><td align="char" char="." valign="top">97.43 (3.30)</td><td align="left" valign="top">98 (51-100)</td></tr><tr><td align="left" valign="top">Hospitalization hours</td><td align="char" char="." valign="top">5.07 (5.56)</td><td align="left" valign="top">2.75 (0&#x2010;24)</td></tr><tr><td align="left" valign="top">Number of lab results</td><td align="char" char="." valign="top">17.25 (10.79)</td><td align="left" valign="top">20 (0&#x2010;75)</td></tr><tr><td align="left" valign="top">Number of medicine</td><td align="char" char="." valign="top">4.04 (2.66)</td><td align="left" valign="top">4 (0&#x2010;26)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>HBP: high blood pressure.</p></fn><fn id="table1fn2"><p><sup>b</sup>LBP: low blood pressure.</p></fn><fn id="table1fn3"><p><sup>c</sup>MAP: mean arterial pressure.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>The demographic of the temporal variables in the studied dataset.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Variables</td><td align="left" valign="top">Range</td></tr></thead><tbody><tr><td align="left" valign="top">Admission time</td><td align="left" valign="top">January 1, 2018 (12:01 AM), to December 31, 2022 (11:43 PM)</td></tr><tr><td align="left" valign="top">Discharge time</td><td align="left" valign="top">January 1, 2018 (1:07 AM), to January 2, 2023 (3:59 PM)</td></tr><tr><td align="left" valign="top">Measure time</td><td align="left" valign="top">January 1, 2018 (1:01 AM), to March 16, 2023 (3:17 PM)</td></tr><tr><td align="left" valign="top">Medication begin time</td><td align="left" valign="top">January 1, 2018 (12:25 AM), to January 2, 2023 (11:47 AM)</td></tr><tr><td align="left" valign="top">Medication end time</td><td align="left" valign="top">January 1, 2018 (12:26 AM), to January 23, 2023 (11:59 PM)</td></tr><tr><td align="left" valign="top">Order check time</td><td align="left" valign="top">January 1, 2018 (12:00 AM), to January 4, 2023 (11:43 AM)</td></tr></tbody></table></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>The demographic of the categorical variables in the studied dataset.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Variables</td><td align="left" valign="top">Categories</td></tr></thead><tbody><tr><td align="left" valign="top">TTAS<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">Resuscitation, emergent, urgent, less urgent, and nonurgent</td></tr><tr><td align="left" valign="top">Visit disposition</td><td align="left" valign="top">ED<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup>, admission, outpatient, transfer out, and other</td></tr><tr><td align="left" valign="top">Medication frequency</td><td align="left" valign="top">statstat, urgent, once, stat, regular, oncedown, statstdn, and statdown</td></tr><tr><td align="left" valign="top"><italic>ICD-10</italic><sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="top">A00-B99, C00-D49, D50-D89, E00-E89, F00-F99, G00-G99, H00-H59, H60-H95, I00-I99, J00-J99, K00-K95, L00-L99, M00-M99, N00-N99, O00-O9A, P00-P96, Q00-Q99, R00-R99, S00-T88, V00-Y99, Z00-Z99, and U00-U85</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>TTAS: Taiwan Triage Acuity Scale.</p></fn><fn id="table3fn2"><p><sup>b</sup>ED: emergency department.</p></fn><fn id="table3fn3"><p><sup>c</sup><italic>ICD-10</italic>: <italic>International Statistical Classification of Diseases, Tenth Revision</italic>.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-2"><title>Prediction Target</title><p>The collected data were divided into 2 cohort groups: URV patients and non-URV patients. Our prediction target is a binary indicator of 72-hour URV (coded as URV/non-URV) in ED. Each visit is labeled with an associated indicator column to indicate whether the patient had an ED revisit within 72 hours.</p></sec><sec id="s2-3"><title>Ethical Considerations</title><p>This study was conducted in accordance with the principles outlined in the Declaration of Helsinki and received approval from the Institutional Review Board (IRB) of KVGH with IRB certification number KSVGH23-CT5-04 (date of approval: October 31, 2023). The requirement for consent to participate was waived by the IRB of KVGH, as the research uses historical electronic medical records without any direct patient intervention. All data points have been deidentified, and no specific individual can be identified from the data. The rights and interests of the patients are not harmed, and this study does not have any impact on patients&#x2019; treatment and medication before and after analyzing the data.</p></sec><sec id="s2-4"><title>Model Development</title><p><xref ref-type="fig" rid="figure2">Figure 2</xref> outlines the proposed system architecture consisting of the following modules: data preprocessing, feature selection, feature embedding, and prediction model. Each is explained in the following sections.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>The architecture of the proposed framework. EHR: electronic health record.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e74053_fig02.png"/></fig></sec><sec id="s2-5"><title>Data Preprocessing</title><p>The studied data consists of 2 parts: structured and unstructured data. This module performs data cleansing and normalization tasks, removing missing fields and out-of-range data and subsequently normalizing data into a consistent range. Variable values within the same range avoid the problem of excessive weight on certain variable values and then improve the performance of model training. According to preliminary studies, <italic>z</italic> score standardization performs better than Min-Max normalization. This study applies <italic>z</italic> score standardization to normalize and redistribute all pathological feature values to the same interval.</p></sec><sec id="s2-6"><title>Model Variable Selection</title><p>Model variables, aka features, provide information for the model, and ML algorithms can automatically determine feature weights during the training process. Typically, incorporating more variables can enhance performance. However, irrelevant variables may negatively affect prediction accuracy. Therefore, in real-world applications, feature selection or model variable selection is a critical process for identifying relevant ones to construct an effective prediction model. Without loss of generality, this research adopts the term feature to describe the model variable.</p><p>The studied dataset comprises 24 distinct features, including both structured and unstructured data. Structured data are derived from EHR, while unstructured data contents originate from clinicians&#x2019; medical notes. To appropriately integrate unstructured data, subjective complaints recorded in medical notes are transformed into corresponding <italic>ICD-10</italic> (<italic>International Statistical Classification of Diseases, Tenth Revision</italic>) codes. This mechanism converts unstructured medical notes into structured data while preserving their original information.</p><p>This study defines 3 feature sets (FSs), denoted as FS<sub>A</sub>, FS<sub>B</sub>, and FS<sub>C</sub>. FS<sub>A</sub> contains all features in the dataset to evaluate model performance without applying any feature selection procedure. Based on preliminary experiments, features related to lab orders and medical orders were found to have no positive impact on the prediction model and were thus excluded from both FS<sub>B</sub> and FS<sub>C</sub>. To further analyze the effect of incorporating unstructured data on model performance, features derived from unstructured data were removed from FS<sub>B</sub>. <xref ref-type="table" rid="table4">Table 4</xref> provides a summary of the features in these 3 sets.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Feature description.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Feature</td><td align="left" valign="top">Type</td><td align="left" valign="top">FS<sub>A</sub><sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="left" valign="top">FS<sub>B</sub></td><td align="left" valign="top">FS<sub>C</sub></td></tr></thead><tbody><tr><td align="left" valign="top">Basic ED<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> visit record</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gender</td><td align="left" valign="top">Cat</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top">&#x2714;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Age</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top">&#x2714;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Admission time</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Discharge time</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>ICD-10</italic><sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">Cat</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top">&#x2714;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>TTAS<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup></td><td align="left" valign="top">Cat</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top">&#x2714;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hospitalization days</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Visit disposition</td><td align="left" valign="top">Cat</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top">&#x2714;</td></tr><tr><td align="left" valign="top" colspan="5">Vital Sign</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Patient ID</td><td align="left" valign="top">Cat</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top">&#x2714;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Case number</td><td align="left" valign="top">Cat</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Measure time</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>HBP<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup></td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top">&#x2714;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LBP<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup></td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top">&#x2714;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Pulse</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top">&#x2714;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Temperature</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top">&#x2714;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Breath</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="5">Lab Order</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Order Check Time</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lab test name</td><td align="left" valign="top">Cat</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lab result</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="5">Medication Order</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Medication begin time</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Medication end time</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Medicine</td><td align="left" valign="top">Cat</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dosage</td><td align="left" valign="top">Num</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Frequency</td><td align="left" valign="top">Cat</td><td align="left" valign="top">&#x2714;</td><td align="left" valign="top"/><td align="left" valign="top"/></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>FS: feature set.</p></fn><fn id="table4fn2"><p><sup>b</sup>ED: emergency department.</p></fn><fn id="table4fn3"><p><sup>c</sup>ICD-10: International Classification of Diseases-10.</p></fn><fn id="table4fn4"><p><sup>d</sup>TTAS: Taiwan Triage Acuity Scale.</p></fn><fn id="table4fn5"><p><sup>e</sup>HBP: high blood pressure.</p></fn><fn id="table4fn6"><p><sup>f</sup>LBP: low blood pressure.</p></fn></table-wrap-foot></table-wrap><p>It is important to note that the patient ID is deidentified and serves to indicate a specific patient, while the case number is a serial identifier for an ED visit. Both features are excluded from the prediction model during training.</p><p>ED visits are listed in chronological order. For structured data, each visit is characterized by the following types of features: (1) basic ED visit record, (2) vital signs, and (3) care order information (as outlined in <xref ref-type="table" rid="table4">Table 4</xref>). The basic ED visit record includes gender, age, <italic>ICD-10</italic>, admission time, discharge time, visit disposition, and triage level coded as a categorical variable based on the type and severity of initial presenting signs and symptoms using the Taiwan Triage and Acuity Scale, ranging from 1 (resuscitation) to 5 (nonurgent). The vital signs include body temperature, respiratory rate, pulse, high blood pressure (HBP), low blood pressure, mean arterial pressure, and oxygen saturation. The care order information includes laboratory tests and medication-related information.</p><p>Past studies have revealed that patients with multiple diseases have high risks of ED visits, where such information typically is recorded in unstructured medical notes during the diagnosis. To improve prediction performance, this study extracts diseases from unstructured subjective, objective, assessment, and plan notes, along with the <italic>ICD-10</italic> from EHR, and then calculates the CCI score [<xref ref-type="bibr" rid="ref14">14</xref>] to indicate the patient&#x2019;s condition.</p></sec><sec id="s2-7"><title>Feature Embedding</title><p>Inputs to ML models must be numerical, and therefore, nonnumeric features usually need to be encoded or embedded before feeding them into the model. Feature embedding or feature encoding serves as a bridge between raw data and model inputs, enabling algorithms to operate efficiently on transformed data. Since feature embedding is as critical as feature selection for building an efficient model, this study designs 2 feature encoding schemes to evaluate the impact of feature embedding and to identify the most suitable one for the prediction model. <xref ref-type="table" rid="table5">Table 5</xref> explains the studied feature encoding schemes in detail.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Studied encoding methods.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Feature</td><td align="left" valign="top">Range</td><td align="left" valign="top">Description</td></tr></thead><tbody><tr><td align="left" valign="bottom" colspan="3">Encoding E<sub>A</sub></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Age<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup> (years)</td><td align="left" valign="top">0-5</td><td align="left" valign="top">0: &#x003C;41; 1: 41-50; 2: 51-60; 3: 61-70; 4: 71-80; 5: &#x003E;80</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MAP<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup> (mmHg)</td><td align="left" valign="top">0-2</td><td align="left" valign="top">0: &#x003C;70; 1: 70-100; 2: &#x003E;100</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>HBP<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup> (mmHg)</td><td align="left" valign="top">0-2</td><td align="left" valign="top">0: &#x003C;90; 1: 90-120; 2: &#x003E;120</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LBP<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup> (mmHg)</td><td align="left" valign="top">0-2</td><td align="left" valign="top">0: &#x003C;60; 1: 60-80; 2: &#x003E;80</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Pulse rate (bpm)</td><td align="left" valign="top">0-2</td><td align="left" valign="top">0: &#x003C;60; 1: 60-100; 2: &#x003E;100</td></tr><tr><td align="left" valign="top" colspan="3">Encoding E<sub>B</sub></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Age<sup><xref ref-type="table-fn" rid="table5fn5">e</xref></sup> (years)</td><td align="left" valign="top">0-2</td><td align="left" valign="top">0: &#x003C;41; 1: 41-65; 2: &#x003E;65</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MAP (mmHg)</td><td align="left" valign="top">0-1</td><td align="left" valign="top">0: 70-100; 1: otherwise</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>HBP (mmHg)</td><td align="left" valign="top">0-1</td><td align="left" valign="top">0: 90-120; 1: otherwise</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LBP (mmHg)</td><td align="left" valign="top">0-1</td><td align="left" valign="top">0: 60-80; 1: otherwise</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Pulse Rate (bpm)</td><td align="left" valign="top">0-1</td><td align="left" valign="top">0: 60-100; 1: otherwise</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Temperature (&#x00B0;C)</td><td align="left" valign="top">0-1</td><td align="left" valign="top">0: 35-38; 1: otherwise</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SPO<sub>2</sub> (%)<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">0-1</td><td align="left" valign="top">0: 95-100; 1: otherwise</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lab test count</td><td align="left" valign="top">0-&#x221E;</td><td align="left" valign="top">Count for the total number of the ordered lab tests</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Medicine count</td><td align="left" valign="top">0-&#x221E;</td><td align="left" valign="top">Count the total number of the ordered medicines</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ICD-10<sup><xref ref-type="table-fn" rid="table5fn7">g</xref></sup></td><td align="left" valign="top">0-22</td><td align="left" valign="top">According to [<xref ref-type="bibr" rid="ref15">15</xref>]</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>Based on Charlson Comorbidity Index.</p></fn><fn id="table5fn2"><p><sup>b</sup>MAP: mean arterial pressure.</p></fn><fn id="table5fn3"><p><sup>c</sup>HBP: high blood pressure.</p></fn><fn id="table5fn4"><p><sup>d</sup>LBP: low blood pressure.</p></fn><fn id="table5fn5"><p><sup>e</sup>Based on Chen et al [<xref ref-type="bibr" rid="ref16">16</xref>].</p></fn><fn id="table5fn6"><p><sup>f</sup>SpO<sub>2</sub>: saturation of peripheral oxygen.</p></fn><fn id="table5fn7"><p><sup>g</sup><italic>ICD-10</italic>: <italic>International Statistical Classification of Diseases, Tenth Revision</italic>.</p></fn></table-wrap-foot></table-wrap><p>The studied data contains a mix of numerical and categorical data. Even though the studied structured data is mostly numerical, its values represent different meanings. Vital signs are in numerical form but can be interpreted as categorical variables, as vital signs usually have a normal range. For example, HBP can be tiered into 3 levels&#x2014;0 (low HBP), 1 (normal HBP), and 2 (high HBP)&#x2014;as shown in the first encoding method of <xref ref-type="table" rid="table5">Table 5</xref>. On the other hand, for the ML model, low HBP and high HBP both imply the patient&#x2019;s HBP is not in the normal range, and there might not be much difference between too high and too low. Therefore, the HBP feature value can be interpreted as normal or nonnormal. As expressed in the second encoding method of <xref ref-type="table" rid="table5">Table 5</xref>, it is categorized into 2 types: 0 for normal HBP and 1 for HBP not in the normal range. Those numerical features not listed in the table are applied in their original numerical values to the ML models.</p><p>When working with categorical data, such as disease names, it is critical to convert them into a numerical format so that ML algorithms can understand them. One-hot encoding is commonly used for encoding categorical variables. This study adopts an improved one-hot encoding scheme, which presents a group of related categories together, as illustrated in <xref ref-type="fig" rid="figure3">Figure 3</xref>.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Pandas&#x2019; one-hot embedding method.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e74053_fig03.png"/></fig></sec><sec id="s2-8"><title>Class Imbalance</title><p>Training an effective model requires a balanced or near-balanced class distribution. However, the datasets collected from real-world environments are typically imbalanced, as most ED visits are non-URV cases, which constitute the major class. Sampling is a process of resampling data to improve dataset distribution, whereas oversampling is a process of increasing the sampling rate of the minority class, while undersampling reduces the sampling rate of the majority class.</p><p>Oversampling techniques applied to the minority class, which are widely used to address data imbalance issues, may introduce several significant challenges, particularly in the medical domain. For instance, methods such as random duplication of existing data can lead to model overfitting, as the model may overly rely on a restricted subset of the input. Furthermore, approaches like SMOTE or other algorithms that dynamically generate synthetic data may pose ethical and legal concerns, as the generated data could be false or misleading, ultimately negatively impacting the prediction model. In contrast, random undersampling can effectively reduce a considerable number of non-URV records, resulting in a balanced dataset with minimal information loss.</p><p>Based on the aforementioned analysis, this study adopts random undersampling to achieve a balanced dataset while minimizing the risks associated with oversampling techniques. Given that oversampling may introduce model overfitting and ethical concerns due to synthetic data generation, random undersampling presents a more reliable approach by reducing the number of non-URV records without compromising data integrity. This method ensures that the dataset maintains a proportional distribution between classes, thereby enhancing the model&#x2019;s generalizability and mitigating bias.</p></sec><sec id="s2-9"><title>Prediction Model</title><p>To identify the optimal ML algorithms tailored for the proposed framework, this study evaluates various classification algorithms commonly used in related literature. These include DT, LR, random forest (RF), support vector machine (SVM), one-class support vector machine (OCSVM), grid search cross-validation (GSCV), multilayer perceptron (MLP), convolutional neural network (CNN), tree-based pipeline optimization tool, and long short-term memory (LSTM).</p><p>Hyperparameter fine-tuning is a critical process that directly influences model performance. To determine the optimal hyperparameters for each algorithm, multiple combinations of hyperparameter sets are independently evaluated.</p><p>Additionally, the different FSs and feature encoding methods described earlier are assessed to construct an effective URV prediction model.</p><p>To develop and evaluate the prediction models, the dataset was randomly partitioned into training and testing sets with a ratio of 8:2. This process was repeated 10 times with different random splits, and the final performance metrics were reported as the average across these 10 runs to ensure robustness and reduce variance due to data partitioning.</p></sec><sec id="s2-10"><title>System Interface</title><p>The proposed system is designed to provide a straightforward and user-friendly interface, enabling physicians to efficiently enter medical records, as illustrated in <xref ref-type="fig" rid="figure4">Figure 4</xref>.</p><p>The interface consists of 2 primary sections: the clinical data input section and the model output section. The clinical data input section includes structured data fields for entering numerical values, as well as dropdown menus for selecting categorical features. The use of dropdown menus minimizes potential input errors and reduces input time, thereby enhancing data entry efficiency. Once the required data are entered, they are fed into the pretrained prediction model upon submission. The prediction model then analyzes the clinical input data to determine whether a patient is at risk of revisiting the ED within 72 hours. The prediction output provides the likelihood of a revisit along with the model&#x2019;s decision, offering physicians a clear assessment of patient risk.</p><p>The intuitive design of the interface increases physician adoption and usability, facilitating seamless integration into clinical workflows. By streamlining data entry and automating risk assessment, the system improves decision-making efficiency while minimizing potential input errors. The straightforward structure ensures that physicians can quickly interpret and act upon prediction results, ultimately supporting more effective ED management.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Graphical user interface of the proposed system as a standalone application.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e74053_fig04.png"/></fig></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>According to past studies and our preliminary study, several factors might impact training efficiency. Therefore, this study conducts 2 experiments in order to obtain an efficient URV prediction model for ED by evaluating different ML models, FSs, and encoding schemes. The first experiment investigates the prediction performance of traditional and modern ML algorithms by applying 2 types of FSs (a complete set vs a subset of selected features), and the second experiment evaluates the impact of feature encoding.</p><p><xref ref-type="fig" rid="figure5">Figure 5</xref> illustrates the process of data selection, data filtering, and the study timeline for a retrospective medical study. The selection process begins with 184,687 ED patients treated between January 2018 and December 2022. EHRs were retrieved from the KVGH database for these patients. To ensure data validity, a screening criterion was applied, requiring at least one valid ED admission. As a result, 34 patients were excluded, leaving a final study cohort of 184,653 patients for analysis.</p><p>All experiments were performed on a personal computing workstation configured with a 12th Generation Intel Core i7 CPU, 32 GB of RAM, an NVIDIA RTX 3060 dedicated GPU, and a 512 GB solid-state drive.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Participant selection, data, and timeline. ED: emergency department; EHR: electronic health record; KVGH: Kaohsiung Veterans General Hospital; URV: unscheduled return visit.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e74053_fig05.png"/></fig></sec><sec id="s3-2"><title>Performance Measurement</title><p>Model performance is evaluated using metrics such as accuracy, recall, and the area under the receiver operating characteristic curve (AUROC). AUROC is a widely used metric for assessing the effectiveness of binary classification models, as the receiver operating characteristic curve illustrates the trade-off between the true positive rate and the false positive rate across various decision thresholds. AUROC values range from 0.5 to 1.0, where a value of 0.5 indicates that the model performs no better than random chance in distinguishing between the 2 classes.</p><p>Certain models may achieve a high recall rate but low accuracy, while others may exhibit high accuracy but low recall. Neither type of model is suitable for reliable prediction. Since AUROC accounts for both aspects of classification performance, this study selects AUROC as the primary metric for evaluating prediction performance.</p></sec><sec id="s3-3"><title>Performance Evaluation of ML Models for URV Prediction</title><p>This section investigates the predictive performance of various ML algorithms using different FSs: FS<sub>A</sub>, FS<sub>B</sub>, and FS<sub>C</sub>. These ML algorithms iteratively learn important patterns from the input data and adjust feature weights accordingly. However, an excessive number of features can introduce noise and negatively impact model training, highlighting the necessity of a feature selection process during training. A carefully selected subset of key features may yield more effective performance. Therefore, in addition to evaluating various ML models, this experiment also examines the effectiveness of the selected features.</p><p><xref ref-type="table" rid="table6">Table 6</xref> summarizes the results, comparing 2 categories of ML models: traditional ML and modern ML. In terms of predictive modeling, modern ML algorithms generally require longer training times but produce better prediction models compared with traditional ML algorithms, with the exception of LSTM. The best-performing modern ML model (CNN) surpasses the best-performing traditional ML model (LR) and outperforms all other models, achieving superior performance with a reasonable training time.</p><table-wrap id="t6" position="float"><label>Table 6.</label><caption><p>The results of experiment 1.</p></caption><table id="table6" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model, encoding, and FS<sup><xref ref-type="table-fn" rid="table6fn1">a</xref></sup></td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom">Recall</td><td align="left" valign="bottom">AUROC<sup><xref ref-type="table-fn" rid="table6fn2">b</xref></sup></td><td align="left" valign="bottom">Training time (sec)</td></tr></thead><tbody><tr><td align="left" valign="top">Traditional ML models</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DT<sup><xref ref-type="table-fn" rid="table6fn3">c</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>E<sub>A</sub></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">0.290</td><td align="left" valign="top">0.908</td><td align="left" valign="top">0.588</td><td align="left" valign="top">0.02</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>B</sub></td><td align="left" valign="top">0.857</td><td align="left" valign="top">0.283</td><td align="left" valign="top">0.581</td><td align="left" valign="top">0.03</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">0.805</td><td align="left" valign="top">0.362</td><td align="left" valign="top">0.592</td><td align="left" valign="top">0.02</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LR<sup><xref ref-type="table-fn" rid="table6fn4">d</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>E<sub>A</sub></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">0.624</td><td align="left" valign="top">0.602</td><td align="left" valign="top">0.636</td><td align="left" valign="top">0.07</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>B</sub></td><td align="left" valign="top">0.547</td><td align="left" valign="top">0.614</td><td align="left" valign="top">0.609</td><td align="left" valign="top">0.07</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">0.628</td><td align="left" valign="top">0.602</td><td align="left" valign="top">0.615</td><td align="left" valign="top">0.07</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>OCSVM<sup><xref ref-type="table-fn" rid="table6fn5">e</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>E<sub>A</sub></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">0.348</td><td align="left" valign="top">0.871</td><td align="left" valign="top">0.600</td><td align="left" valign="top">1.19</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>B</sub></td><td align="left" valign="top">0.140</td><td align="left" valign="top">0.893</td><td align="left" valign="top">0.502</td><td align="left" valign="top">0.48</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">0.169</td><td align="left" valign="top">0.894</td><td align="left" valign="top">0.518</td><td align="left" valign="top">0.40</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>RF<sup><xref ref-type="table-fn" rid="table6fn6">f</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>E<sub>A</sub></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">0.628</td><td align="left" valign="top">0.636</td><td align="left" valign="top">0.632</td><td align="left" valign="top">1.11</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>B</sub></td><td align="left" valign="top">0.629</td><td align="left" valign="top">0.548</td><td align="left" valign="top">0.590</td><td align="left" valign="top">0.53</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">0.633</td><td align="left" valign="top">0.619</td><td align="left" valign="top">0.626</td><td align="left" valign="top">0.94</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SVM<sup><xref ref-type="table-fn" rid="table6fn7">g</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>E<sub>A</sub></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">0.432</td><td align="left" valign="top">0.689</td><td align="left" valign="top">0.556</td><td align="left" valign="top">4.99</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>B</sub></td><td align="left" valign="top">0.411</td><td align="left" valign="top">0.725</td><td align="left" valign="top">0.562</td><td align="left" valign="top">4.06</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">0.678</td><td align="left" valign="top">0.558</td><td align="left" valign="top">0.620</td><td align="left" valign="top">3.76</td></tr><tr><td align="left" valign="top">Modern ML<sup><xref ref-type="table-fn" rid="table6fn8">h</xref></sup> models</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CNN<sup><xref ref-type="table-fn" rid="table6fn9">i</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>E<sub>A</sub></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">0.565</td><td align="left" valign="top">0.718</td><td align="left" valign="top">0.705</td><td align="left" valign="top">48.61</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>B</sub></td><td align="left" valign="top">0.629</td><td align="left" valign="top">0.562</td><td align="left" valign="top">0.647</td><td align="left" valign="top">48.36</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">0.646</td><td align="left" valign="top">0.620</td><td align="left" valign="top">0.698</td><td align="left" valign="top">42.74</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>GSCV<sup><xref ref-type="table-fn" rid="table6fn10">j</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>E<sub>A</sub></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">0.630</td><td align="left" valign="top">0.640</td><td align="left" valign="top">0.639</td><td align="left" valign="top">864.23</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>B</sub></td><td align="left" valign="top">0.645</td><td align="left" valign="top">0.560</td><td align="left" valign="top">0.600</td><td align="left" valign="top">888.46</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">0.693</td><td align="left" valign="top">0.577</td><td align="left" valign="top">0.637</td><td align="left" valign="top">882.76</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>LSTM<sup><xref ref-type="table-fn" rid="table6fn11">k</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>E<sub>A</sub></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">0.043</td><td align="left" valign="top">0.989</td><td align="left" valign="top">0.568</td><td align="left" valign="top">52.35</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>B</sub></td><td align="left" valign="top">0.503</td><td align="left" valign="top">0.538</td><td align="left" valign="top">0.526</td><td align="left" valign="top">50.95</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">0.608</td><td align="left" valign="top">0.565</td><td align="left" valign="top">0.633</td><td align="left" valign="top">51.27</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MLP<sup><xref ref-type="table-fn" rid="table6fn12">l</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>E<sub>A</sub></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">0.568</td><td align="left" valign="top">0.719</td><td align="left" valign="top">0.692</td><td align="left" valign="top">13.06</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>B</sub></td><td align="left" valign="top">0.803</td><td align="left" valign="top">0.321</td><td align="left" valign="top">0.626</td><td align="left" valign="top">8.32</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">0.649</td><td align="left" valign="top">0.613</td><td align="left" valign="top">0.691</td><td align="left" valign="top">14.87</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>TPOT<sup><xref ref-type="table-fn" rid="table6fn13">m</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>E<sub>A</sub></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">0.642</td><td align="left" valign="top">0.685</td><td align="left" valign="top">0.663</td><td align="left" valign="top">183.23</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>B</sub></td><td align="left" valign="top">0.653</td><td align="left" valign="top">0.556</td><td align="left" valign="top">0.607</td><td align="left" valign="top">148.94</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">0.684</td><td align="left" valign="top">0.614</td><td align="left" valign="top">0.650</td><td align="left" valign="top">177.05</td></tr></tbody></table><table-wrap-foot><fn id="table6fn1"><p><sup>a</sup>FS: feature set.</p></fn><fn id="table6fn2"><p><sup>b</sup>AUROC: area under the receiver operating characteristic.</p></fn><fn id="table6fn3"><p><sup>c</sup>DT: decision tree.</p></fn><fn id="table6fn4"><p><sup>d</sup>LR: logistic regression.</p></fn><fn id="table6fn5"><p><sup>e</sup>OCSVM: one-class support vector machine.</p></fn><fn id="table6fn6"><p><sup>f</sup>RF: random forest.</p></fn><fn id="table6fn7"><p><sup>g</sup>SVM: support vector machine.</p></fn><fn id="table6fn8"><p><sup>h</sup>ML: machine learning.</p></fn><fn id="table6fn9"><p><sup>i</sup>CNN: convolutional neural network.</p></fn><fn id="table6fn10"><p><sup>j</sup>GSCV: grid search cross-validation.</p></fn><fn id="table6fn11"><p><sup>k</sup>LSTM: long short-term memory.</p></fn><fn id="table6fn12"><p><sup>l</sup>MLP: multilayer perceptron.</p></fn><fn id="table6fn13"><p><sup>m</sup>TPOT: tree-based pipeline optimization tool.</p></fn></table-wrap-foot></table-wrap><p>Among these combinations, LR with FS<sub>A</sub> outperforms other traditional ML algorithms in terms of AUROC, which is indicative of overall model performance. The evaluated traditional ML models (DT, SVM, and OCSVM) exhibit diverse prediction performances, with some demonstrating high accuracy but low recall, while others show high recall but low accuracy. Notably, LR and RF deliver stable performance across both metrics.</p><p>In contrast, most modern ML models yield stable prediction performance, except for LSTM. While LSTM is highly suitable for time-series prediction, it is not appropriate for the current dataset, leading to the poorest performance among all modern ML and traditional ML models, except OCSVM with FS<sub>B</sub>. Given that the studied dataset comprises only 24 distinct features, simpler algorithms such as DT and LR in traditional ML and CNN in modern ML outperform more complex models.</p><p>The superior performance of simpler models on this dataset can be attributed to the nature of the data. Complex algorithms, such as LSTM, typically require larger datasets with extensive FSs to effectively capture patterns and avoid overfitting. When applied to datasets with fewer features, these models are more prone to overfitting, leading to reduced generalization and poorer performance. In contrast, simpler algorithms, which rely on fewer parameters and are less prone to overfitting, can effectively handle smaller datasets, making them more suitable in such cases.</p></sec><sec id="s3-4"><title>Impact of Feature Set on Model Performance</title><p>With respect to feature selection, the complete FS (FS<sub>A</sub>) generally builds better prediction models compared with the subsets (FS<sub>B</sub> and FS<sub>C</sub>) according to the results in <xref ref-type="table" rid="table6">Table 6</xref>. The discrepancies in AUROC between FS<sub>A</sub> and FS<sub>C</sub> fall within &#x00B1;1, suggesting that the subset contains critical determinants for URV prediction. Both FS<sub>B</sub> and FS<sub>C</sub> primarily consist of vital signs and age, indicating that these are key features for URV prediction. Moreover, FS<sub>C</sub> incorporates medical notes and outperforms FS<sub>B</sub> across all evaluation models, highlighting the importance of unstructured data in enhancing predictive performance.</p></sec><sec id="s3-5"><title>Comparison of Training Time Across ML Models</title><p>Regarding training time, traditional ML algorithms generally require less time to complete their training phases compared with modern ML algorithms. GSCV, for instance, requires at least 860 seconds to build a prediction model but does not achieve the best detection results. In contrast, CNN, which yields the best performance, completes its training phase in an average of 48 seconds, while MLP, the second-best algorithm, requires less than 15 seconds on average. As MLP is a simplified version of CNN, it is expected that CNN takes longer training time than MLP. Notably, both MLP and CNN outperform other models, with only minor discrepancies observed between their performances.</p></sec><sec id="s3-6"><title>Performance Evaluation of ML Models With Different Feature Encoding</title><p>This section investigates the impact of feature encoding on model training. This experiment evaluates 2 encoding methods (E<sub>A</sub> and E<sub>B</sub>) on the 2 best prediction models (MLP and CNN) with the best FS (FS<sub>A</sub>) obtained from the previous experiment and another feature subset (FS<sub>C</sub>), since FS<sub>C</sub> outperforms FS<sub>B</sub> across all evaluation models. The studied encoding methods are described in the previous section and outlined in <xref ref-type="table" rid="table5">Table 5</xref>. FS<sub>C</sub> includes FS<sub>B</sub> and some other relevant features, as shown in <xref ref-type="table" rid="table4">Table 4</xref>, in order to investigate the encoding impact on different types of features.</p><p><xref ref-type="table" rid="table7">Table 7</xref> lists the evaluation results, where the boldface figure indicates the best of a given performance measurement. The results demonstrate that the encoding method has a certain impact on model training. A simplified encoding E<sub>B</sub> performs better than E<sub>A</sub>. That is, categorizing vital signs into 2 types (normal and abnormal) can better represent the meaning of the features than the 3 types (low, normal, and high); converting <italic>ICD-10</italic> into 22 categories defined by World Health Organization can better represent the meaning of the diseases; age classified into 3 categories (0: &#x003C;41 years; 1: 41-65 years; 2: &#x003E;65 years) is better than the 6 categories defined by CCI (0: &#x003C;41 years; 1: 41-50 years; 2: 51-60 years; 3: 61-70 years; 4: 71-80 years; 5: &#x003E;80 years).</p><table-wrap id="t7" position="float"><label>Table 7.</label><caption><p>The results of experiment 2.</p></caption><table id="table7" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model and FS<sup><xref ref-type="table-fn" rid="table7fn1">a</xref></sup></td><td align="left" valign="bottom">Encoding</td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom">Recall</td><td align="left" valign="bottom">AUROC<sup><xref ref-type="table-fn" rid="table7fn2">b</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">MLP<sup><xref ref-type="table-fn" rid="table7fn3">c</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">E<sub>A</sub></td><td align="left" valign="top">0.568</td><td align="left" valign="top">0.719</td><td align="left" valign="top">0.692</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">E<sub>B</sub></td><td align="left" valign="top">0.602</td><td align="left" valign="top">0.724</td><td align="left" valign="top">0.734</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">E<sub>A</sub></td><td align="left" valign="top">0.649<sup><xref ref-type="table-fn" rid="table7fn4">d</xref></sup></td><td align="left" valign="top">0.613</td><td align="left" valign="top">0.694</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">E<sub>B</sub></td><td align="left" valign="top">0.620</td><td align="left" valign="top">0.652</td><td align="left" valign="top">0.698</td></tr><tr><td align="left" valign="top">CNN<sup><xref ref-type="table-fn" rid="table7fn5">e</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">E<sub>A</sub></td><td align="left" valign="top">0.565</td><td align="left" valign="top">0.718</td><td align="left" valign="top">0.705</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>A</sub></td><td align="left" valign="top">E<sub>B</sub></td><td align="left" valign="top">0.606</td><td align="left" valign="top">0.740<sup><xref ref-type="table-fn" rid="table7fn4">d</xref></sup></td><td align="left" valign="top">0.747<sup><xref ref-type="table-fn" rid="table7fn4">d</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">E<sub>A</sub></td><td align="left" valign="top">0.646</td><td align="left" valign="top">0.620</td><td align="left" valign="top">0.698</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FS<sub>C</sub></td><td align="left" valign="top">E<sub>B</sub></td><td align="left" valign="top">0.625</td><td align="left" valign="top">0.673</td><td align="left" valign="top">0.715</td></tr></tbody></table><table-wrap-foot><fn id="table7fn1"><p><sup>a</sup>FS: feature set.</p></fn><fn id="table7fn2"><p><sup>b</sup>AUROC: area under the receiver operating characteristic curve.</p></fn><fn id="table7fn3"><p><sup>c</sup>MLP: multilayer perceptron.</p></fn><fn id="table7fn4"><p><sup>d</sup>The best of the given performance measurement.</p></fn><fn id="table7fn5"><p><sup>e</sup>CNN: convolutional neural network.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-7"><title>Model Parameters</title><p>The CNN model architecture consists of a repeated block structure, composed of two 1D convolutional layers followed by a 1D max-pooling layer. This block is repeated 5 times, after which the output is passed to a fully connected layer and finally mapped to the probability of a URV.</p><p>Each convolutional layer uses 64 filters with a kernel size of 3 and uses the rectified linear unit as the activation function. The max-pooling layer is configured with a pool size of 2.</p><p>For model training, the number of epochs was set to 100, and an early stopping mechanism was implemented to prevent overfitting, with a patience value of 25. The model was optimized using the Nadam optimizer with a batch size of 256. A dynamic learning rate adjustment strategy was applied, where the learning rate was reduced by a factor of 0.5 if no improvement was observed for 5 consecutive epochs. The minimum learning rate was set to 1<sup>e&#x2013;4</sup>, with epsilon set to 0.0001.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study proposes an ML-assisted system for predicting patients at risk of revisiting the ED, leveraging features extracted from both structured and unstructured medical data. The structured data consists of patients&#x2019; EHRs, while the unstructured data includes medical notes. The findings indicate that the conventional trade-off between training time and prediction performance may not be universally applicable. While traditional ML models require significantly less training time, modern ML models demand at least twice as much, if not more. When computational resources or training time are constrained, traditional ML models such as LR can serve as effective prediction tools; however, when such limitations are not a major concern, CNN is recommended. Additionally, while incorporating a broad range of relevant features enhances predictive performance, a subset of key features may have a dominant impact on model outcomes. In particular, vital signs and age are identified as critical predictors for URV, and properly encoding features into the appropriate categories can further improve model efficiency.</p><p>In this study, 2 encoding strategies (E<sub>A</sub> and E<sub>B</sub>) were evaluated. The experimental results indicate that models trained on datasets encoded using the E<sub>B</sub> approach consistently outperform those trained with the E<sub>A</sub> approach. This performance difference can be attributed to the characteristics of the respective encoding methods. Although E<sub>B</sub> uses a relatively simpler encoding scheme, it distinctly classifies variables into 2 well-defined categories: normal and abnormal. In contrast, E<sub>A</sub> uses a 3-category system&#x2014; &#x201C;too low,&#x201D; &#x201C;normal,&#x201D; and &#x201C;too high.&#x201D; However, the categories &#x201C;too low&#x201D; and &#x201C;too high&#x201D; both represent abnormal conditions and may not be sufficiently distinguishable in practice. This lack of distinction could introduce ambiguity for the predictive model, thereby adversely affecting its performance.</p><p>For practical implementation, AUROC is used to represent the overall performance of a model. Models with higher AUROC values are associated with fewer false alerts while maintaining an acceptable true positive rate. According to the experimental results, among traditional ML models, LR demonstrates the best performance in predicting URV, achieving an AUROC of 0.636. Among modern ML models, CNN outperforms its counterparts in terms of AUROC values.</p><p>In scenarios where capturing all URV cases is prioritized, recall serves as a critical performance indicator. Among traditional ML models, DT achieves the highest recall rate of 0.908, while among modern ML models, LSTM achieves the highest recall value of 0.989. However, it is noteworthy that both DT and LSTM exhibit low accuracy values, indicating that these models tend to generate a considerable number of false alerts.</p></sec><sec id="s4-2"><title>Limitations</title><p>A notable finding is that, although advanced CNN-based models such as LSTM typically outperform CNN in most ML applications, this advantage does not necessarily hold in URV prediction for ED visits. One possible explanation is that ED visits often lack prior knowledge of a patient&#x2019;s visit history, which limits the predictive capacity of sequential models like LSTM. Furthermore, the absence of sufficient medical history may constrain the overall performance of ML-based prediction models. Future research could explore the integration of patients&#x2019; comprehensive medical histories to enhance predictive accuracy. Additionally, the diverse causes of ED revisits present a challenge for ML models, as they make it difficult to distinguish patterns among different revisit cases. Investigating ML-based predictions for specific revisit causes may further refine model performance.</p><p>Given the nonstandardized nature of medical notes, this study transforms the unstructured textual content into corresponding <italic>ICD-10</italic> codes. This structured representation has been shown to enhance the predictive performance of the model. However, medical notes possess a wide array of clinically relevant information beyond <italic>ICD-10</italic> codes, including chief complaints, prior treatments, and allergy histories. Therefore, the application of advanced natural language processing techniques may further improve predictive outcomes by enabling the extraction of richer features from unstructured clinical text.</p></sec><sec id="s4-3"><title>Comparison With Prior Work</title><p>Previous studies mostly focused on general revisits, while studies specifically addressing ED revisits were relatively understudied. Most existing work (Vest and Ben-Assuli [<xref ref-type="bibr" rid="ref11">11</xref>]) considered a long prediction window, such as 30 days, while revisit time frames are likely shorter, for example, 72 hours [<xref ref-type="bibr" rid="ref12">12</xref>]. Most existing prediction models selected features from merely one type of EHR data, rarely considering both types of patients&#x2019; medical data: structured EHR and unstructured medical notes. Prior studies [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>] that applied ML prediction models primarily evaluated 1 or 2 models and rarely analyzed the performance of multiple prediction models or various FSs.</p><p>A similar study by Guo et al [<xref ref-type="bibr" rid="ref8">8</xref>] on ED revisits incorporated both structured and unstructured medical records by converting them into semantic patterns and developing a customized bidirectional encoder representations from transformers (BERT) model, referred to as BlueBERT, to predict URVs. The issue of data imbalance, with URV cases accounting for only 2.22% of their studied dataset, was addressed using random undersampling techniques. Their experimental results demonstrated the superiority of BlueBERT compared with other models, such as KNN, RF, and XGB, in terms of AUROC.</p><p>To the best of our knowledge, our study is one of the few attempts to combine 2 types of patients&#x2019; medical data (structured and unstructured) to identify unplanned revisits to the ED and is the first study that conducts a comprehensive performance evaluation of traditional as well as modern ML classification models, where the traditional ones include LR, RF, SVM, and OCSVM and the modern ones include GSCV, MLP, CNN, tree-based pipeline optimization tool, and an improved CNN LSTM. Furthermore, this study analyzes the importance of feature selection and the impact of feature embedding on the efficiency of model training.</p></sec><sec id="s4-4"><title>Conclusions</title><p>This study evaluates both traditional ML and modern ML models for predicting the URVs in ED and examines the impacts of feature selection and feature encoding on model training. The evaluation concludes the following findings: (1) adopting an appropriate model is important for a targeted problem, (2) not all the MLL models are superior to traditional ML ones, (3) an advanced modern ML model might not yield better performance than a basic modern ML model (such as CNN) or a traditional ML (such as LR), (4) a complicated algorithm requiring long training time (such as GSCV) might not construct an efficient prediction model, (5) feature selection is relevant to build an efficient model, (6) finding key features is critical for interpreting the prediction results, (7) feature encoding affects the efficiency of model training, and (8) an encoding scheme which better represents the meaning of the features could yield a better prediction model.</p></sec></sec></body><back><fn-group><fn fn-type="con"><p>C-MC and W-CJ contributed to the conceptualization of the study. C-MC, Z-HY, and Z-XC developed the methodology. Z-HY was responsible for the software. W-CJ, C-MC, and Z-XC performed the validation. Z-HY and W-CJ collected the data. C-MC and Z-XC prepared the original draft of the manuscript. W-CJ reviewed and edited the manuscript. Z-XC and Z-HY created the visualizations. W-CJ and C-MC supervised the work. W-CJ managed the project administration.</p></fn><fn fn-type="conflict"><p>W-CJ is an employee of Kaohsiung Veterans General Hospital and receives a salary from the institution. The other authors declare that they have no competing interests or financial support related to this study.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUROC</term><def><p>area under the receiver operating characteristic</p></def></def-item><def-item><term id="abb2">BERT</term><def><p>bidirectional encoder representations from transformers</p></def></def-item><def-item><term id="abb3">CCI</term><def><p>Charlson Comorbidity Index</p></def></def-item><def-item><term id="abb4">CNN</term><def><p>convolutional neural network</p></def></def-item><def-item><term id="abb5">DT</term><def><p>decision tree</p></def></def-item><def-item><term id="abb6">ED</term><def><p>emergency department</p></def></def-item><def-item><term id="abb7">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb8">FS</term><def><p>feature set</p></def></def-item><def-item><term id="abb9">GSCV</term><def><p>grid search cross-validation</p></def></def-item><def-item><term id="abb10">HBP</term><def><p>high blood pressure</p></def></def-item><def-item><term id="abb11"><italic>ICD-10</italic></term><def><p><italic>International Statistical Classification of Diseases, Tenth Revision</italic></p></def></def-item><def-item><term id="abb12">IRB</term><def><p>institutional review board</p></def></def-item><def-item><term id="abb13">KVGH</term><def><p>Kaohsiung Veterans General Hospital</p></def></def-item><def-item><term id="abb14">LR</term><def><p>logistic regression</p></def></def-item><def-item><term id="abb15">LSTM</term><def><p>long short-term memory</p></def></def-item><def-item><term id="abb16">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb17">MLP</term><def><p>multilayer perceptron</p></def></def-item><def-item><term id="abb18">OCSVM</term><def><p>one-class support vector machine</p></def></def-item><def-item><term id="abb19">RF</term><def><p>random forest</p></def></def-item><def-item><term id="abb20">SVM</term><def><p>support vector machine</p></def></def-item><def-item><term id="abb21">URV</term><def><p>unscheduled return visit</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pines</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Mutter</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Zocchi</surname><given-names>MS</given-names> </name></person-group><article-title>Variation in emergency department admission rates across the United States</article-title><source>Med Care Res Rev</source><year>2013</year><month>04</month><volume>70</volume><issue>2</issue><fpage>218</fpage><lpage>231</lpage><pub-id pub-id-type="doi">10.1177/1077558712470565</pub-id><pub-id pub-id-type="medline">23295438</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="web"><article-title>Open data - emergency department visits</article-title><source>Ministry of Health and Welfare</source><access-date>2025-02-11</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://dep.mohw.gov.tw/Dos/lp-6600-113.html">https://dep.mohw.gov.tw/Dos/lp-6600-113.html</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>de Gelder</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lucke</surname><given-names>JA</given-names> </name><name name-style="western"><surname>de Groot</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Predictors and outcomes of revisits in older adults discharged from the emergency department</article-title><source>J Am Geriatr Soc</source><year>2018</year><month>04</month><volume>66</volume><issue>4</issue><fpage>735</fpage><lpage>741</lpage><pub-id pub-id-type="doi">10.1111/jgs.15301</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Duseja</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bardach</surname><given-names>NS</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>GA</given-names> </name><etal/></person-group><article-title>Revisit rates and associated costs after an emergency department encounter: a multistate analysis</article-title><source>Ann Intern Med</source><year>2015</year><month>06</month><day>2</day><volume>162</volume><issue>11</issue><fpage>750</fpage><lpage>756</lpage><pub-id pub-id-type="doi">10.7326/M14-1616</pub-id><pub-id pub-id-type="medline">26030633</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ben-Assuli</surname><given-names>O</given-names> </name><name name-style="western"><surname>Vest</surname><given-names>JR</given-names> </name></person-group><article-title>Return visits to the emergency department: an analysis using group based curve models</article-title><source>Health Informatics J</source><year>2022</year><month>04</month><volume>28</volume><issue>2</issue><fpage>14604582221105444</fpage><pub-id pub-id-type="doi">10.1177/14604582221105444</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>CL</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>FT</given-names> </name><name name-style="western"><surname>Chiang</surname><given-names>YC</given-names> </name><etal/></person-group><article-title>Unplanned emergency department revisits within 72 hours to a secondary teaching referral hospital in Taiwan</article-title><source>J Emerg Med</source><year>2010</year><month>05</month><volume>38</volume><issue>4</issue><fpage>512</fpage><lpage>517</lpage><pub-id pub-id-type="doi">10.1016/j.jemermed.2008.03.039</pub-id><pub-id pub-id-type="medline">18947963</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lin</surname><given-names>LT</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>SF</given-names> </name><name name-style="western"><surname>Chao</surname><given-names>CC</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>HA</given-names> </name></person-group><article-title>Predictors of 72-h unscheduled return visits with admission in patients presenting to the emergency department with abdominal pain</article-title><source>Eur J Med Res</source><year>2023</year><month>08</month><day>17</day><volume>28</volume><issue>1</issue><fpage>288</fpage><pub-id pub-id-type="doi">10.1186/s40001-023-01256-7</pub-id><pub-id pub-id-type="medline">37592352</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guo</surname><given-names>DY</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>KH</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>IC</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>KY</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Hsiao</surname><given-names>KY</given-names> </name></person-group><article-title>The association between emergency department revisit and elderly patients</article-title><source>J Acute Med</source><year>2020</year><month>03</month><day>1</day><volume>10</volume><issue>1</issue><fpage>20</fpage><lpage>26</lpage><pub-id pub-id-type="doi">10.6705/j.jacme.202003_10(1).0003</pub-id><pub-id pub-id-type="medline">32995151</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tangkulpanich</surname><given-names>P</given-names> </name><name name-style="western"><surname>Yuksen</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kongchok</surname><given-names>W</given-names> </name><name name-style="western"><surname>Jenpanitpong</surname><given-names>C</given-names> </name></person-group><article-title>Clinical predictors of emergency department revisits within 48 hours of discharge; a case control study</article-title><source>Arch Acad Emerg Med</source><year>2021</year><volume>9</volume><issue>1</issue><fpage>e1</fpage><pub-id pub-id-type="doi">10.22037/aaem.v9i1.891</pub-id><pub-id pub-id-type="medline">33313568</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Ng</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Hsu</surname><given-names>CC</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>CW</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>SY</given-names> </name></person-group><article-title>Machine learning models for predicting unscheduled return visits to an emergency department: a scoping review</article-title><source>BMC Emerg Med</source><year>2024</year><month>01</month><day>30</day><volume>24</volume><issue>1</issue><fpage>20</fpage><pub-id pub-id-type="doi">10.1186/s12873-024-00939-6</pub-id><pub-id pub-id-type="medline">38287243</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vest</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Ben-Assuli</surname><given-names>O</given-names> </name></person-group><article-title>Prediction of emergency department revisits using area-level social determinants of health measures and health information exchange information</article-title><source>Int J Med Inform</source><year>2019</year><month>09</month><volume>129</volume><fpage>205</fpage><lpage>210</lpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2019.06.013</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McCusker</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bellavance</surname><given-names>F</given-names> </name><name name-style="western"><surname>Cardin</surname><given-names>S</given-names> </name><name name-style="western"><surname>Belzile</surname><given-names>E</given-names> </name><name name-style="western"><surname>Verdon</surname><given-names>J</given-names> </name></person-group><article-title>Prediction of hospital utilization among elderly patients during the 6 months after an emergency department visit</article-title><source>Ann Emerg Med</source><year>2000</year><month>11</month><volume>36</volume><issue>5</issue><fpage>438</fpage><lpage>445</lpage><pub-id pub-id-type="doi">10.1067/mem.2000.110822</pub-id><pub-id pub-id-type="medline">11054196</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Davazdahemami</surname><given-names>B</given-names> </name><name name-style="western"><surname>Peng</surname><given-names>P</given-names> </name><name name-style="western"><surname>Delen</surname><given-names>D</given-names> </name></person-group><article-title>A deep learning approach for predicting early bounce-backs to the emergency departments</article-title><source>Healthcare Analytics</source><year>2022</year><month>11</month><volume>2</volume><fpage>100018</fpage><pub-id pub-id-type="doi">10.1016/j.health.2022.100018</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Charlson</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Pompei</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ales</surname><given-names>KL</given-names> </name><name name-style="western"><surname>MacKenzie</surname><given-names>CR</given-names> </name></person-group><article-title>A new method of classifying prognostic comorbidity in longitudinal studies: development and validation</article-title><source>J Chronic Dis</source><year>1987</year><volume>40</volume><issue>5</issue><fpage>373</fpage><lpage>383</lpage><pub-id pub-id-type="doi">10.1016/0021-9681(87)90171-8</pub-id><pub-id pub-id-type="medline">3558716</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="report"><person-group person-group-type="author"><collab>World Health Organization</collab></person-group><article-title>The ICD-10 classification of mental and behavioural disorders: clinical descriptions and diagnostic guidelines</article-title><year>1992</year><publisher-name>World Health Organization</publisher-name></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>TY</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>TY</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>YC</given-names> </name></person-group><article-title>Using a clinical narrative-aware pre-trained language model for predicting emergency department patient disposition and unscheduled return visits</article-title><source>J Biomed Inform</source><year>2024</year><month>07</month><volume>155</volume><fpage>104657</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2024.104657</pub-id><pub-id pub-id-type="medline">38772443</pub-id></nlm-citation></ref></ref-list></back></article>