<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR AI</journal-id><journal-id journal-id-type="publisher-id">ai</journal-id><journal-id journal-id-type="index">41</journal-id><journal-title>JMIR AI</journal-title><abbrev-journal-title>JMIR AI</abbrev-journal-title><issn pub-type="epub">2817-1705</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v4i1e65456</article-id><article-id pub-id-type="doi">10.2196/65456</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Estimation of Static Lung Volumes and Capacities From Spirometry Using Machine Learning: Algorithm Development and Validation</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Helgeson</surname><given-names>Scott A</given-names></name><degrees>MS, MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Quicksall</surname><given-names>Zachary S</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Johnson</surname><given-names>Patrick W</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lim</surname><given-names>Kaiser G</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Carter</surname><given-names>Rickey E</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lee</surname><given-names>Augustine S</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Division of Pulmonary and Critical Care Medicine, Mayo Clinic</institution><addr-line>4500 San Pablo Road S</addr-line><addr-line>Jacksonville</addr-line><addr-line>FL</addr-line><country>United States</country></aff><aff id="aff2"><institution>Digital Innovation Laboratory, Department of Quantitative Health Sciences, Mayo Clinic</institution><addr-line>Jacksonville</addr-line><addr-line>FL</addr-line><country>United States</country></aff><aff id="aff3"><institution>Division of Pulmonary and Critical Care Medicine, Mayo Clinic</institution><addr-line>Rochester</addr-line><addr-line>MN</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Emam</surname><given-names>Khaled El</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Singh</surname><given-names>Karanbir</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Liu</surname><given-names>Songqiao</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Scott A Helgeson, MS, MD, Division of Pulmonary and Critical Care Medicine, Mayo Clinic, 4500 San Pablo Road S, Jacksonville, FL, 32224, United States, 1 9049532000; <email>helgeson.scott@mayo.edu</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>24</day><month>3</month><year>2025</year></pub-date><volume>4</volume><elocation-id>e65456</elocation-id><history><date date-type="received"><day>01</day><month>10</month><year>2024</year></date><date date-type="rev-recd"><day>18</day><month>12</month><year>2024</year></date><date date-type="accepted"><day>09</day><month>02</month><year>2025</year></date></history><copyright-statement>&#x00A9; Scott A Helgeson, Zachary S Quicksall, Patrick W Johnson, Kaiser G Lim, Rickey E Carter, Augustine S Lee. Originally published in JMIR AI (<ext-link ext-link-type="uri" xlink:href="https://ai.jmir.org">https://ai.jmir.org</ext-link>), 24.3.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.ai.jmir.org/">https://www.ai.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://ai.jmir.org/2025/1/e65456"/><abstract><sec><title>Background</title><p>Spirometry can be performed in an office setting or remotely using portable spirometers. Although basic spirometry is used for diagnosis of obstructive lung disease, clinically relevant information such as restriction, hyperinflation, and air trapping require additional testing, such as body plethysmography, which is not as readily available. We hypothesize that spirometry data contains information that can allow estimation of static lung volumes in certain circumstances by leveraging machine learning techniques.</p></sec><sec><title>Objective</title><p>The aim of the study was to develop artificial intelligence-based algorithms for estimating lung volumes and capacities using spirometry measures.</p></sec><sec sec-type="methods"><title>Methods</title><p>This study obtained spirometry and lung volume measurements from the Mayo Clinic pulmonary function test database for patient visits between February 19, 2001, and December 16, 2022. Preprocessing was performed, and various machine learning algorithms were applied, including a generalized linear model with regularization, random forests, extremely randomized trees, gradient-boosted trees, and XGBoost for both classification and regression cohorts.</p></sec><sec sec-type="results"><title>Results</title><p>A total of 121,498 pulmonary function tests were used in this study, with 85,017 allotted for exploratory data analysis and model development (ie, training dataset) and 36,481 tests reserved for model evaluation (ie, testing dataset). The median age of the cohort was 64.7 years (IQR 18&#x2010;119.6), with a balanced distribution between genders, consisting 48.2% (n=58,607) female and 51.8% (n=62,889) male patients. The classification models showed a robust performance overall, with relatively low root mean square error and mean absolute error values observed across all predicted lung volumes. Across all lung volume categories, the models demonstrated strong discriminatory capacity, as indicated by the high area under the receiver operating characteristic curve values ranging from 0.85 to 0.99 in the training set and 0.81 to 0.98 in the testing set.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Overall, the models demonstrate robust performance across lung volume measurements, underscoring their potential utility in clinical practice for accurate diagnosis and prognosis of respiratory conditions, particularly in settings where access to body plethysmography or other lung volume measurement modalities is limited.</p></sec></abstract><kwd-group><kwd>artificial intelligence</kwd><kwd>machine learning</kwd><kwd>pulmonary function test</kwd><kwd>spirometry</kwd><kwd>total lung capacity</kwd><kwd>AI</kwd><kwd>ML</kwd><kwd>lung</kwd><kwd>lung volume</kwd><kwd>lung capacity</kwd><kwd>spirometer</kwd><kwd>lung disease</kwd><kwd>database</kwd><kwd>respiratory</kwd><kwd>pulmonary</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Pulmonary function testing (PFT) provides physiological measurements of the respiratory system across multiple dimensions, typically classified into (<xref ref-type="bibr" rid="ref1">1</xref>) spirometry, which measures air flow, lung volumes, and capacities during a expiratory forced vital capacity (FVC) maneuver; (<xref ref-type="bibr" rid="ref2">2</xref>) static lung volumes; and (<xref ref-type="bibr" rid="ref3">3</xref>) gas exchange parameters such as the diffusing capacity for carbon monoxide and oxygen saturations [<xref ref-type="bibr" rid="ref1">1</xref>]. PFTs are critical for the diagnosis and prognostication of respiratory disorders, and provide a noninvasive method for measuring and monitoring the degree of respiratory impairment [<xref ref-type="bibr" rid="ref2">2</xref>]. They are recommended for the initial evaluation of patients with chronic dyspnea and other respiratory symptoms, as well as for individuals at risk of respiratory complications due to transplant or surgery [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>].</p><p>Basic spirometry remains the most widely used component of PFT, largely due to its size and portability, allowing it to be performed in clinic office settings or remotely at home with adequate training. However, spirometry, by definition is an expiratory FVC maneuver that focuses on assessing airflow limitations and does not directly measure static lung volumes, which can be integral to understanding many respiratory conditions [<xref ref-type="bibr" rid="ref4">4</xref>]. Accurate determination of static lung volumes traditionally necessitates more complex and resource-intensive techniques such as body plethysmography or gas dilution methods, with body plethysmography serving as the current gold standard [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. However, these methods, while precise, may not always be readily accessible, cost-effective, or suitable for routine clinical practice outside a specialized pulmonary function laboratory.</p><p>Advancements in artificial intelligence (AI) techniques have introduced new avenues in health care, offering the potential to derive comprehensive insights from existing data, including patterns not easily recognizable through human interpretation or standard statistical modeling. A prior study by Beverin et al [<xref ref-type="bibr" rid="ref7">7</xref>] examined the prediction of total lung capacity from spirometry using three tree-based machine learning (ML) models, achieving a mean squared error of 560.1 mL. They further developed models to classify restrictive ventilatory impairment, achieving a sensitivity and specificity of 83% and 92%, respectively. However, they did not explore prediction of the complete lung volume assessments. Predicting functional residual capacity status, for example, could facilitate the prevention of atelectasis during anesthesia [<xref ref-type="bibr" rid="ref8">8</xref>]. Another study by Evankovich et al [<xref ref-type="bibr" rid="ref9">9</xref>] developed a regression model in patients with chronic obstructive pulmonary disease (COPD) to predict residual volume and its elevation status, achieving an area under the receiver operating characteristic curve (ROC) of 0.95 for predicting residual volume above 175%. However, these models lack applicability beyond the COPD cohort [<xref ref-type="bibr" rid="ref9">9</xref>]. Given this context, we hypothesized that ML models could predict static lung volumes using spirometry alone across a diverse cohort of lung conditions. Such an approach could reduce the need for identifying those who would benefit most from formal lung volume assessments. In this study, we applied ML approaches to develop and validate an algorithm for estimating lung volumes and capacities from standard spirometry. We further examined the model performance among subsets of physiologic derangements such as obstructive and restrictive ventilatory disorders.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Cohort Selection</title><p>This study was approved by the Institutional Review Board (20&#x2010;009821) with a waiver of consent. The dataset curated for this study was obtained from the Mayo Clinic PFT database, which houses PFT data from two distinct US regions (Midwest and Southeast), with records from February 19, 2001, to December 16, 2022. The PFTs performed on the same day&#x2014;with paired spirometry and lung volume data, without the use of methacholine or a bronchodilator&#x2014;were identified. Individuals under 18 years of age and patients who opted out of authorizing their data for research use were excluded from the analysis. All lung volume measurements were performed using body plethysmography. For models trained to classify normal versus abnormal lung volume measures, an additional requirement was applied to ensure nonmissing demographics within the boundaries of the Global Lung Initiative GLI2021 lung volume estimation equations [<xref ref-type="bibr" rid="ref10">10</xref>]. If an individual underwent multiple PFTs, only their most recent PFT measurement comprising both lung volumes and spirometry was used. The following lung volume measures were selected for prediction: expiratory reserve volume (ERV), functional residual capacity (FRC), residual volume (RV), total lung capacity (TLC), the ratio of RV to TLC as a percentage (RV/TLC), and vital capacity (VC).</p></sec><sec id="s2-2"><title>Preprocessing</title><p>Following the initial database query, the dataset was augmented with reference lung function measures for both spirometry and lung volume measures, including the lower limit of normal function (LLN), the upper limit of normal function (ULN), and the expected volume. These values were generated using a custom package built according to the Global Lung Initiative pulmonary function testing reference equation publications [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. The LLN and ULN values were used to assign &#x201C;normal&#x201D; (within the LLN/ULN range) or &#x201C;abnormal&#x201D; (below LLN or above ULN) status to reformulate the lung volume regression problem into a classification task.</p><p>Both the regression and classification data sets were split into independent training and testing subsets using a randomized 70/30 split before any downstream exploratory analysis or model development. Features provided to the models included forced expiratory volume in the first second of exhalation (FEV1), forced vital capacity (FVC), the ratio of FEV1 and FVC (FEV1/FVC), peak expiratory flow, estimated maximum vital capacity, age, gender, height, weight, and race (White, African American, Northeast Asian, Southeast Asian, and Other).</p></sec><sec id="s2-3"><title>Model Selection and Evaluation</title><p>A randomized grid search was performed using various ML algorithms, including a generalized linear model with regularization, distributed random forests, extremely randomized trees, gradient-boosted trees, and XGBoost. Models were tuned using appropriate parameter grids via five-fold cross-validation on the training dataset to provide estimates of performance summarized using applicable metrics, including root mean squared error (RMSE) for regression and area under the receiver operating characteristic curve (ROC-AUC) for classification [<xref ref-type="bibr" rid="ref13">13</xref>]. Final tuning parameters were selected from the candidate model with the highest cross-validation performance (lowest RMSE for regression, highest ROC-AUC for classification), which was ranked highest among all explored configurations. The model was then refitted to the full training data set using the chosen hyperparameters before evaluation on the testing dataset (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). For the classification models, the probability threshold was selected to maximize the Youden index on the training data set.</p><p>The regression model performance was evaluated visually using prediction scatter plots and summary metrics, including RMSE, mean absolute error (MAE), mean signed difference, mean percentage error (MPE), mean absolute percentage error (MAPE), and the correlation-based coefficient of determination [<xref ref-type="bibr" rid="ref14">14</xref>]. The classification model was evaluated with the area under the receiver-operating-characteristic curve (AUC), accuracy , sensitivity (SENS), specificity, positive predictive value, negative predictive value (NPV), precision, recall, positive likelihood ratio (LRT+), negative likelihood ratio (LRT-), odds ratio, and F1-score. All modeling was performed using the H2O AutoML cluster (version 3.44.0.3) [<xref ref-type="bibr" rid="ref15">15</xref>]. Further details regarding the grid search process, parameter tuning, and model implementation are available in the H2O official documentation [<xref ref-type="bibr" rid="ref15">15</xref>] (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p><p>In the cohort summary tables, categorical data were displayed as counts and percentages, while continuous data were displayed as medians and ranges. Standardized mean differences were computed to identify significant differences in variables between the training and testing datasets, with insignificant differences defined as a value &#x003C;0.1. The regression and classification models were applied to the specific PFT patterns (normal, obstructed, restricted, and mixed pattern) defined by the American Thoracic Society (ATS) [<xref ref-type="bibr" rid="ref10">10</xref>]. All analyses were performed using R software (version 4.2.2; R Foundation for Statistical Computing) on a Google Cloud Platform virtual machine.</p></sec><sec id="s2-4"><title>Ethical Considerations</title><p>This study was approved by the Mayo Clinic Institutional Review board (22-009471) and was determined to be exempt (45 CFR 46.104d, Category 4). All data was deidentified for this study, and no compensation was provided to the participants</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>A total of 121,498 PFTs were used in this study, with 85,017 allocated for exploratory data analysis and model development and 36,481 tests reserved for model evaluation. The median age across the cohort was 64.7 years (IQR 18&#x2010;119.6), with a nearly balanced gender distribution between genders, with 48.2% (n=58,607) female patients and 51.8% (n=62,889) male patients. The cohort was predominantly White (n= 114,388, 94.1%), followed by African American patients (n=4,656, 3.8%). Of particular importance, the distribution of baseline PFT measures&#x2014;both spirometry and lung volumes&#x2014;showed no differences between the training and testing datasets. Standardized mean differences, indicating the degree of difference between the training and testing sets, were minimal across all variables, suggesting a well-balanced model development and testing cohorts. A complete breakdown is provided in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Cohort summary.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variables</td><td align="left" valign="bottom">Training dataset<break/>(n=85,015)</td><td align="left" valign="bottom">Testing dataset<break/>(n=36,481)</td><td align="left" valign="bottom">Total (N=121,496)</td><td align="left" valign="bottom">Standardized difference</td></tr></thead><tbody><tr><td align="left" valign="top">Age (years), median (IQR)</td><td align="left" valign="top">64.7 (18.0-119.6)</td><td align="left" valign="top">64.7 (18.0-101.0)</td><td align="left" valign="top">64.7 (18.0-119.6)</td><td align="left" valign="top">.005</td></tr><tr><td align="left" valign="top" colspan="4">Gender, n (%)</td><td align="left" valign="top">.004</td></tr><tr><td align="left" valign="top">&#x2003; Female</td><td align="left" valign="top">40,964 (48.2)</td><td align="left" valign="top">17,643 (48.4)</td><td align="left" valign="top">58,607 (48.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003; Male</td><td align="left" valign="top">44,051 (51.8)</td><td align="left" valign="top">18,838 (51.6)</td><td align="left" valign="top">62,889 (51.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Race, n (%)</td><td align="left" valign="top">.01</td></tr><tr><td align="left" valign="top">&#x2003;White</td><td align="left" valign="top">80,048 (94.2)</td><td align="left" valign="top">34,340 (94.1)</td><td align="left" valign="top">114,388 (94.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003; African American</td><td align="left" valign="top">3223 (3.8)</td><td align="left" valign="top">1433 (3.9)</td><td align="left" valign="top">4656 (3.8)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003; Southeast Asian</td><td align="left" valign="top">508 (0.6)</td><td align="left" valign="top">213 (0.6)</td><td align="left" valign="top">721 (0.6)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003; Northeast Asian</td><td align="left" valign="top">64 (0.1)</td><td align="left" valign="top">27 (0.1)</td><td align="left" valign="top">91 (0.1)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003; Other</td><td align="left" valign="top">1172 (1.4)</td><td align="left" valign="top">468 (1.3)</td><td align="left" valign="top">1640 (1.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Height (m), median (IQR)</td><td align="left" valign="top">1.7 (0.5-2.2)</td><td align="left" valign="top">1.7 (0.2-2.0)</td><td align="left" valign="top">1.7 (0.2-2.2)</td><td align="left" valign="top">.001</td></tr><tr><td align="left" valign="top">Weight (kg), median (IQR)</td><td align="left" valign="top">82.8 (7.8-253.4)</td><td align="left" valign="top">82.9 (12.9-400.0)</td><td align="left" valign="top">82.8 (7.8, 400.0)</td><td align="left" valign="top">.001</td></tr><tr><td align="left" valign="top" colspan="4">ATS<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> Pattern, n (%)</td><td align="left" valign="top">.007</td></tr><tr><td align="left" valign="top">&#x2003; Normal</td><td align="left" valign="top">33,150 (41.2)</td><td align="left" valign="top">14,346 (41.6)</td><td align="left" valign="top">47,496 (41.3)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003; Obstruction</td><td align="left" valign="top">16,810 (20.9)</td><td align="left" valign="top">7173 (20.8)</td><td align="left" valign="top">23,983 (20.9)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003; Restriction</td><td align="left" valign="top">19,856 (24.7)</td><td align="left" valign="top">8482 (24.6)</td><td align="left" valign="top">28,338 (24.7)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003; Mixed defect</td><td align="left" valign="top">10,611 (13.2)</td><td align="left" valign="top">4512 (13.1)</td><td align="left" valign="top">15,123 (13.2)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="5">PFT<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> measures, median (IQR)</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;FEV1<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">2.0 (0.2-6.8)</td><td align="left" valign="top">2.0 (0.2-6.1)</td><td align="left" valign="top">2.0 (0.2-6.8)</td><td align="left" valign="top">.005</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;FVC<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">2.9 (0.3-8.8)</td><td align="left" valign="top">2.9 (0.5-8.3)</td><td align="left" valign="top">2.9 (0.3-8.8)</td><td align="left" valign="top">.004</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;FEV1/FVC<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup></td><td align="left" valign="top">71.6 (16.2-100.0)</td><td align="left" valign="top">71.5 (16.2-100.0)</td><td align="left" valign="top">71.6 (16.2-100.0)</td><td align="left" valign="top">.002</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;PEF<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="top">6.1 (0.7-18.8)</td><td align="left" valign="top">6.2 (0.6-17.5)</td><td align="left" valign="top">6.2 (0.6-18.8)</td><td align="left" valign="top">.001</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;VC (Spiro)<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></td><td align="left" valign="top">2.9 (0.3-8.8)</td><td align="left" valign="top">2.9 (0.5-8.3)</td><td align="left" valign="top">2.9 (0.3-8.8)</td><td align="left" valign="top">.004</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;RV<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup></td><td align="left" valign="top">2.3 (0.0-11.8)</td><td align="left" valign="top">2.3 (0.1-10.4)</td><td align="left" valign="top">2.3 (0.0-11.8)</td><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;TLC<sup><xref ref-type="table-fn" rid="table1fn9">i</xref></sup></td><td align="left" valign="top">5.5 (0.9-13.9)</td><td align="left" valign="top">5.5 (1.3-13.1)</td><td align="left" valign="top">5.5 (0.9-13.9)</td><td align="left" valign="top">.004</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;RV/TLC<sup><xref ref-type="table-fn" rid="table1fn10">j</xref></sup></td><td align="left" valign="top">43.6 (1.2-90.7)</td><td align="left" valign="top">43.6 (3.4-89.7)</td><td align="left" valign="top">43.6 (1.2-90.7)</td><td align="left" valign="top">.002</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;FRC<sup><xref ref-type="table-fn" rid="table1fn11">k</xref></sup></td><td align="left" valign="top">3.2 (0.5-12.3)</td><td align="left" valign="top">3.2 (0.4-10.8)</td><td align="left" valign="top">3.2 (0.4-12.3)</td><td align="left" valign="top">.004</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;ERV<sup><xref ref-type="table-fn" rid="table1fn12">l</xref></sup></td><td align="left" valign="top">0.8 (0.0-4.4)</td><td align="left" valign="top">0.8 (0.0-4.1)</td><td align="left" valign="top">0.8 (0.0-4.4)</td><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top">&#x2003;&#x2003;VC (Pleth)<sup><xref ref-type="table-fn" rid="table1fn13">m</xref></sup></td><td align="left" valign="top">3.0 (0.3-8.8)</td><td align="left" valign="top">3.0 (0.5-8.4)</td><td align="left" valign="top">3.0 (0.3-8.8)</td><td align="left" valign="top">.003</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>ATS: American Thoracic Society.</p></fn><fn id="table1fn2"><p><sup>b</sup>Pulmonary function test.</p></fn><fn id="table1fn3"><p><sup>c</sup>FEV1: Forced expiratory volume in the first second.</p></fn><fn id="table1fn4"><p><sup>d</sup>FVC: Forced vital capacity.</p></fn><fn id="table1fn5"><p><sup>e</sup>FEV/FVC: Ratio of FEV1 to FVC (as a percentage).</p></fn><fn id="table1fn6"><p><sup>f</sup>PEF: Peak expiratory flow.</p></fn><fn id="table1fn7"><p><sup>g</sup>VC (Spiro): Vital capacity measured via spirometry.</p></fn><fn id="table1fn8"><p><sup>h</sup>RV: Residual volume.</p></fn><fn id="table1fn9"><p><sup>i</sup>TLC: Total lung capacity.</p></fn><fn id="table1fn10"><p><sup>j</sup>RV/TLC: Ratio of RV to TLC (as a percentage).</p></fn><fn id="table1fn11"><p><sup>k</sup>FRC: Functional residual capacity.</p></fn><fn id="table1fn12"><p><sup>l</sup>ERV: Expiratory reserve volume.</p></fn><fn id="table1fn13"><p><sup>m</sup>VC (Pleth): Vital capacity measured via body plethysmography.</p></fn></table-wrap-foot></table-wrap><p><xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> stratifies the same cohort according to the ATS classification criteria for pulmonary function patterns (ie, normal, obstructive, restrictive, and mixed pattern). This stratification highlights differences in demographics and pulmonary function measures between individuals with normal, obstructive, restrictive, or mixed patterns assigned using spirometry. Predictably, spirometry measures&#x2014;including FEV1, FVC, and the FEV1/FVC ratio&#x2014;significantly differed between groups (<italic>P</italic> values&#x003C;.001), as did all phenotype-related parameters presented in the table.</p><sec id="s3-1"><title>Lung Volume Regression</title><p>The final models chosen for evaluation were selected based on the lowest RMSE values and varied minimally in type across the lung volumes of interest. XGBoost models were identified as the best approach for predicting all lung volumes except TLC, for which traditional gradient-boosted trees showed superior performance.</p><p>Model metrics were similar between the training and testing cohorts, suggesting a reasonable trade-off between overfitting and underfitting during model training (<xref ref-type="table" rid="table2">Table 2</xref>). Findings showed a strong performance overall, with relatively low RMSE and MAE values observed across all predicted lung volumes. MPE showed a negative skew across all lung volumes. However, quantile-quantile plot analyses showed that predicted values closely followed a theoretical normal distribution, with slight underprediction and overprediction of high and low values at the extremes, respectively. Paired with mean signed differences of zero&#x2014;also known as the mean bias error&#x2014;these evaluations suggest no global bias in the direction of model predictions. Instead, these skewed MPE values were the result of extreme values at the tails of the distribution. A complete breakdown of model performance metrics is presented in <xref ref-type="table" rid="table2">Table 2</xref>, with complementary prediction scatter plots in <xref ref-type="fig" rid="figure1">Figure 1</xref>. Further subgroup analysis with different ATS patterns showed relatively similar results overall and across all categories in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 2</xref>).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Regression model performance metrics.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variables</td><td align="left" valign="bottom" colspan="6">Training dataset</td><td align="left" valign="bottom" colspan="6">Testing dataset</td></tr><tr><td align="left" valign="bottom">Volume</td><td align="left" valign="bottom">RMSE (L)<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="bottom">MAE<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="bottom">MSD (L)<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="bottom">MPE (%)<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup></td><td align="left" valign="bottom">MAPE (%)<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup></td><td align="left" valign="bottom">RSQ<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup></td><td align="left" valign="bottom">RMSE (L)</td><td align="left" valign="bottom">MAE</td><td align="left" valign="bottom">MSD (L)</td><td align="left" valign="bottom">MPE (%)</td><td align="left" valign="bottom">MAPE (%)</td><td align="left" valign="bottom">RSQ</td></tr></thead><tbody><tr><td align="left" valign="top">Expiratory Reserve Volume (ERV)</td><td align="left" valign="top">0.31</td><td align="left" valign="top">0.24</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2212;40.12</td><td align="left" valign="top">60.28</td><td align="left" valign="top">0.64</td><td align="left" valign="top">0.33</td><td align="left" valign="top">0.25</td><td align="left" valign="top">0.00</td><td align="left" valign="top">&#x2212;39.10</td><td align="left" valign="top">59.95</td><td align="left" valign="top">0.61</td></tr><tr><td align="left" valign="top">Functional Residual Capacity (FRC)</td><td align="left" valign="top">0.56</td><td align="left" valign="top">0.42</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2212;2.83</td><td align="left" valign="top">12.93</td><td align="left" valign="top">0.78</td><td align="left" valign="top">0.59</td><td align="left" valign="top">0.44</td><td align="left" valign="top">0.00</td><td align="left" valign="top">&#x2212;2.91</td><td align="left" valign="top">13.51</td><td align="left" valign="top">0.75</td></tr><tr><td align="left" valign="top">Residual Volume (RV)</td><td align="left" valign="top">0.54</td><td align="left" valign="top">0.40</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2212;4.86</td><td align="left" valign="top">17.29</td><td align="left" valign="top">0.73</td><td align="left" valign="top">0.56</td><td align="left" valign="top">0.41</td><td align="left" valign="top">0.00</td><td align="left" valign="top">&#x2212;4.92</td><td align="left" valign="top">17.80</td><td align="left" valign="top">0.71</td></tr><tr><td align="left" valign="top">RV / TLC</td><td align="left" valign="top">5.07</td><td align="left" valign="top">3.93</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2212;1.61</td><td align="left" valign="top">9.55</td><td align="left" valign="top">0.82</td><td align="left" valign="top">5.20</td><td align="left" valign="top">4.03</td><td align="left" valign="top">0.03</td><td align="left" valign="top">&#x2212;1.58</td><td align="left" valign="top">9.83</td><td align="left" valign="top">0.81</td></tr><tr><td align="left" valign="top">Total Lung Capacity (TLC)</td><td align="left" valign="top">0.55</td><td align="left" valign="top">0.41</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2212;1.07</td><td align="left" valign="top">7.57</td><td align="left" valign="top">0.87</td><td align="left" valign="top">0.58</td><td align="left" valign="top">0.43</td><td align="left" valign="top">0.00</td><td align="left" valign="top">&#x2212;1.10</td><td align="left" valign="top">7.92</td><td align="left" valign="top">0.85</td></tr><tr><td align="left" valign="top">Vital Capacity (VC)</td><td align="left" valign="top">0.15</td><td align="left" valign="top">0.11</td><td align="left" valign="top">0</td><td align="left" valign="top">&#x2212;0.27</td><td align="left" valign="top">3.73</td><td align="left" valign="top">0.98</td><td align="left" valign="top">0.15</td><td align="left" valign="top">0.11</td><td align="left" valign="top">0.00</td><td align="left" valign="top">&#x2212;0.33</td><td align="left" valign="top">3.91</td><td align="left" valign="top">0.98</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Root mean squared error.</p></fn><fn id="table2fn2"><p><sup>b</sup>Mean absolute error.</p></fn><fn id="table2fn3"><p><sup>c</sup>Mean signed deviation.</p></fn><fn id="table2fn4"><p><sup>d</sup>Mean percent error.</p></fn><fn id="table2fn5"><p><sup>e</sup>Mean absolute percent error.</p></fn><fn id="table2fn6"><p><sup>f</sup>R-Squared.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Regression scatter plots of predicted versus true lung volume measures.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e65456_fig01.png"/></fig></sec><sec id="s3-2"><title>Lung Volume Classification</title><p>Due to limitations in demographic information (ie, age and race) required for the calculation of LLN and ULN boundaries, a total of 114,377 PFTs from the regression cohort were successfully recharacterized for the development of classification models, with 34,314 PFTs reserved for model evaluation. A comparison of demographics, spirometry, and lung volumes between the training and testing data sets can be seen in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendices 5</xref> and <xref ref-type="supplementary-material" rid="app6">6</xref>. These tables mirror the factors presented in <xref ref-type="table" rid="table1">Table 1</xref>, except for the lung volume classes (normal vs abnormal), which are unique to this subset.</p><p>Similar to the regression tasks, the final classification models selected for downstream evaluation varied minimally in type across lung volumes and were selected based on the largest ROC-AUC values. Traditional gradient-boosted trees ranked best for classifying lung volume status for FRC and vital capacity. XGBoost models ranked at the top for all other lung volume classifications. Across all lung volume categories, the models demonstrated strong discriminatory capacity, as indicated by high AUC values ranging from 0.85 to 0.99 in the training dataset and 0.81 to 0.98 in the testing dataset. High accuracy scores, ranging from 0.74 to 0.93, illustrate the ability of each model to correctly classify instances overall, with sensitivity scores ranging from 0.73 to 0.93 in the testing data set, indicating the effectiveness in identifying positive cases (ie, lung volume measurements outside the expected normal range). The high NPVs (ranging from 0.84 to 0.94) highlight each model&#x2019;s ability to correctly identify normal lung volumes. The greater variation in positive predictive value across the lung volume classes (ranging from 0.35&#x2010;0.94) suggests that some models may struggle to identify positive cases correctly, relative to the larger population of normal test findings. Classification performance metrics can be found in <xref ref-type="table" rid="table3">Table 3</xref>, with complementary ROC curves in <xref ref-type="fig" rid="figure2">Figure 2</xref>.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Classification model performance metrics.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Volume</td><td align="left" valign="bottom" colspan="10">Training dataset</td><td align="left" valign="bottom" colspan="10">Testing dataset</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">AUC<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="bottom">ACC<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td><td align="left" valign="bottom">SENS<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="bottom">SPEC<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="left" valign="bottom">PPV<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="left" valign="bottom">NPV<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="bottom">LRT+<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup></td><td align="left" valign="bottom">LRT-<sup><xref ref-type="table-fn" rid="table3fn8">h</xref></sup></td><td align="left" valign="bottom">OR<sup><xref ref-type="table-fn" rid="table3fn9">i</xref></sup></td><td align="left" valign="bottom">F1<sup><xref ref-type="table-fn" rid="table3fn10">j</xref></sup></td><td align="left" valign="bottom">AUC</td><td align="left" valign="bottom">ACC</td><td align="left" valign="bottom">SENS</td><td align="left" valign="bottom">SPEC</td><td align="left" valign="bottom">PPV</td><td align="left" valign="bottom">NPV</td><td align="left" valign="bottom">LRT+</td><td align="left" valign="bottom">LRT-</td><td align="left" valign="bottom">OR</td><td align="left" valign="bottom">F1</td></tr></thead><tbody><tr><td align="left" valign="top">Expiratory reserve volume (ERV)</td><td align="left" valign="top">&#x2003;0.85</td><td align="left" valign="top">&#x2003;0.76</td><td align="left" valign="top">&#x2003;0.78</td><td align="left" valign="top">&#x2003;0.76</td><td align="left" valign="top">&#x2003;0.38</td><td align="left" valign="top">&#x2003;0.95</td><td align="left" valign="top">3.24</td><td align="left" valign="top">&#x2003;0.29</td><td align="left" valign="top">&#x2003;11.23</td><td align="left" valign="top">&#x2003;0.51</td><td align="left" valign="top">&#x2003;0.81</td><td align="left" valign="top">&#x2003;0.74</td><td align="left" valign="top">&#x2003;0.73</td><td align="left" valign="top">&#x2003;0.75</td><td align="left" valign="top">&#x2003;0.35</td><td align="left" valign="top">&#x2003;0.94</td><td align="left" valign="top">&#x2003;2.87</td><td align="left" valign="top">&#x2003;0.36</td><td align="left" valign="top">&#x2003;7.95</td><td align="left" valign="top">&#x2003;0.47</td></tr><tr><td align="left" valign="top">Functional residual capacity (FRC)</td><td align="left" valign="top">&#x2003;0.88</td><td align="left" valign="top">&#x2003;0.80</td><td align="left" valign="top">&#x2003;0.79</td><td align="left" valign="top">&#x2003;0.80</td><td align="left" valign="top">&#x2003;0.58</td><td align="left" valign="top">&#x2003;0.92</td><td align="left" valign="top">&#x2003;3.99</td><td align="left" valign="top">&#x2003;0.26</td><td align="left" valign="top">&#x2003;15.16</td><td align="left" valign="top">&#x2003;0.67</td><td align="left" valign="top">&#x2003;0.84</td><td align="left" valign="top">&#x2003;0.78</td><td align="left" valign="top">&#x2003;0.75</td><td align="left" valign="top">&#x2003;0.78</td><td align="left" valign="top">&#x2003;0.55</td><td align="left" valign="top">&#x2003;0.90</td><td align="left" valign="top">&#x2003;3.48</td><td align="left" valign="top">&#x2003;0.32</td><td align="left" valign="top">&#x2003;10.90</td><td align="left" valign="top">&#x2003;0.63</td></tr><tr><td align="left" valign="top">Residual volume (RV)</td><td align="left" valign="top">&#x2003;0.90</td><td align="left" valign="top">&#x2003;0.82</td><td align="left" valign="top">&#x2003;0.80</td><td align="left" valign="top">&#x2003;0.83</td><td align="left" valign="top">&#x2003;0.60</td><td align="left" valign="top">&#x2003;0.93</td><td align="left" valign="top">&#x2003;4.70</td><td align="left" valign="top">&#x2003;0.24</td><td align="left" valign="top">&#x2003;19.89</td><td align="left" valign="top">&#x2003;0.69</td><td align="left" valign="top">&#x2003;0.87</td><td align="left" valign="top">&#x2003;0.80</td><td align="left" valign="top">&#x2003;0.76</td><td align="left" valign="top">&#x2003;0.81</td><td align="left" valign="top">&#x2003;0.56</td><td align="left" valign="top">&#x2003;0.91</td><td align="left" valign="top">&#x2003;4.01</td><td align="left" valign="top">&#x2003;0.30</td><td align="left" valign="top">&#x2003;13.40</td><td align="left" valign="top">&#x2003;0.65</td></tr><tr><td align="left" valign="top">RV/TLC (%)</td><td align="left" valign="top">&#x2003;0.91</td><td align="left" valign="top">&#x2003;0.82</td><td align="left" valign="top">&#x2003;0.82</td><td align="left" valign="top">&#x2003;0.83</td><td align="left" valign="top">&#x2003;0.78</td><td align="left" valign="top">&#x2003;0.86</td><td align="left" valign="top">&#x2003;4.77</td><td align="left" valign="top">&#x2003;0.22</td><td align="left" valign="top">&#x2003;21.60</td><td align="left" valign="top">&#x2003;0.80</td><td align="left" valign="top">&#x2003;0.90</td><td align="left" valign="top">&#x2003;0.81</td><td align="left" valign="top">&#x2003;0.80</td><td align="left" valign="top">&#x2003;0.82</td><td align="left" valign="top">&#x2003;0.78</td><td align="left" valign="top">&#x2003;0.84</td><td align="left" valign="top">&#x2003;4.43</td><td align="left" valign="top">&#x2003;0.24</td><td align="left" valign="top">&#x2003;18.52</td><td align="left" valign="top">&#x2003;0.79</td></tr><tr><td align="left" valign="top">Total lung capacity (TLC)</td><td align="left" valign="top">&#x2003;0.93</td><td align="left" valign="top">&#x2003;0.85</td><td align="left" valign="top">&#x2003;0.84</td><td align="left" valign="top">&#x2003;0.85</td><td align="left" valign="top">&#x2003;0.73</td><td align="left" valign="top">&#x2003;0.92</td><td align="left" valign="top">&#x2003;5.71</td><td align="left" valign="top">&#x2003;0.19</td><td align="left" valign="top">&#x2003;30.77</td><td align="left" valign="top">&#x2003;0.78</td><td align="left" valign="top">&#x2003;0.89</td><td align="left" valign="top">&#x2003;0.82</td><td align="left" valign="top">&#x2003;0.79</td><td align="left" valign="top">&#x2003;0.83</td><td align="left" valign="top">&#x2003;0.69</td><td align="left" valign="top">&#x2003;0.89</td><td align="left" valign="top">&#x2003;4.70</td><td align="left" valign="top">&#x2003;0.25</td><td align="left" valign="top">&#x2003;18.86</td><td align="left" valign="top">&#x2003;0.74</td></tr><tr><td align="left" valign="top">Vital capacity (VC)</td><td align="left" valign="top">&#x2003;0.99</td><td align="left" valign="top">&#x2003;0.95</td><td align="left" valign="top">&#x2003;0.95</td><td align="left" valign="top">&#x2003;0.94</td><td align="left" valign="top">&#x2003;0.95</td><td align="left" valign="top">&#x2003;0.94</td><td align="left" valign="top">&#x2003;16.59</td><td align="left" valign="top">&#x2003;0.05</td><td align="left" valign="top">&#x2003;309.54</td><td align="left" valign="top">&#x2003;0.95</td><td align="left" valign="top">&#x2003;0.98</td><td align="left" valign="top">&#x2003;0.93</td><td align="left" valign="top">&#x2003;0.93</td><td align="left" valign="top">&#x2003;0.92</td><td align="left" valign="top">&#x2003;0.94</td><td align="left" valign="top">&#x2003;0.91</td><td align="left" valign="top">&#x2003;12.13</td><td align="left" valign="top">&#x2003;0.08</td><td align="left" valign="top">&#x2003;160.18</td><td align="left" valign="top">&#x2003;0.93</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>AUC: area under the receiver operating curve.</p></fn><fn id="table3fn2"><p><sup>b</sup>ACC: accuracy.</p></fn><fn id="table3fn3"><p><sup>c</sup>SENS: sensitivity.</p></fn><fn id="table3fn4"><p><sup>d</sup>SPEC: specificity.</p></fn><fn id="table3fn5"><p><sup>e</sup>PPV: positive predictive value.</p></fn><fn id="table3fn6"><p><sup>f</sup>NPV: negative predictive value.</p></fn><fn id="table3fn7"><p><sup>g</sup>LRT+: likelihood ratio test+.</p></fn><fn id="table3fn8"><p><sup>h</sup>LRT&#x2013;: likelihood ratio test-.</p></fn><fn id="table3fn9"><p><sup>i</sup>OR: odds ratio.</p></fn><fn id="table3fn10"><p><sup>j</sup>F1: F1-score.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Classification receiver operating characteristic (ROC) curves.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e65456_fig02.png"/></fig><p>When stratified by PFT patterns, unique strengths, and weaknesses were observed across subgroups (<xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>). These variations can be attributed to the limitations of the training data, feature space, and models, while others were driven by the rarity of certain lung volume abnormalities in specific spirometry-defined patterns. For instance, in classifying ERV status&#x2014;arguably the most challenging lung volume explored in this study&#x2014;the model showed consistently high NPVs across all spirometry pattern types, highlighting general confidence in predicting normal lung volume status. However, it achieved notably better sensitivity in the &#x201C;restriction&#x201D; and &#x201C;mixed pattern&#x201D; subsets (0.91 and 0.75). Comparing these sensitivities and other metrics to those in the &#x201C;normal&#x201D; and &#x201C;obstruction&#x201D; subgroups, the model seems to struggle to detect positive cases in patients with normal or obstructive spirometry findings.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><p>The development of ML models to predict lung volume status (normal vs abnormal findings) from spirometry in over 110,000 patients has yielded highly encouraging results, displaying remarkable discriminatory power with high AUC values (0.81&#x2010;0.95) across measured lung volumes. Estimates of FRC, TLC, RV, and the RV/TLC ratio status show strong sensitivity and specificity. These metrics remain largely consistent across spirometry-defined pattern subgroups, with a few exceptions that can generally be attributed to the rarity of abnormal lung volume measures in certain spirometry patterns. The ability to predict lung volume measures without having to perform extensive testing represents a promising innovation for improving the diagnosis and management of dyspnea and chronic respiratory diseases, particularly in the primary care setting [<xref ref-type="bibr" rid="ref16">16</xref>]. The strong predictive performance of lung volume measurement underscores the potential of these models as a transformative tool in respiratory medicine, offering substantial clinical implications and opportunities for enhancing patient care.</p><p>The performance of the regression models showed a high correlation between the training and testing datasets, suggesting that the models were able to effectively capture the relationship between spirometry-derived features and measured lung volumes and capacities derived from body plethysmography. The effectiveness of the models was evident in their ability to closely approximate lung volumes with minimal deviation from true values on average. The RMSE and MAE values are low relative to their respective lung volume ranges. For instance, the median TLC measure in the cohort was 5.5 L, with the model attaining an MAE of 0.43 L and an MAPE of 7.92%. The ability to accurately estimate the RV/TLC ratio further highlights the potential of these models in capturing the dynamic interplay between these volumes, which is particularly relevant in differentiating between common lung conditions such as COPD, asthma, and restrictive lung diseases [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref20">20</xref>]. The high R-squared values observed for TLC (0.87 in the training set and 0.85 in the testing set) underscore the model&#x2019;s capacity to capture a significant portion of the variance in TLC measurement. Similarly, the robust estimation of RV (R-squared of 0.73 in the training set and 0.71 in the testing set) and FRC (R-squared of 0.78 in the training set and 0.75 in the testing set) further validates model reliability in estimating lung volumes crucial for the evaluation of respiratory function. The model demonstrated a high correlation for vital capacity (<italic>R</italic><sup>2</sup>=0.98). However, this finding is misleading, as spirometry already provides an accurate estimate of vital capacity, making it trivial to map to a similar value obtained via body plethysmography, assuming minimal measurement error and consistent effort on the part of the patient when executing breathing maneuvers. A significant change in TLC has been reported to be 10% over one year, whereas this model was able to predict TLC within 7.5% and 550 mL [<xref ref-type="bibr" rid="ref10">10</xref>]. No significant changes were reported in FRC or RV over time. Considering the performance metrics as a whole, the potential of these models to augment clinical practice is encouraging, with R-squared values exceeding 0.7 for all volumes except ERV, which seems to be the most challenging volume to predict accurately. Estimation of TLC, RV, and their ratio (RV/TLC) is particularly promising, as the accurate estimation of the RV/TLC ratio facilitates the identification of air trapping and hyperinflation, which are key factors in many patients&#x2019; symptomatology [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref20">20</xref>]. Moreover, the reasonable estimation of FRC suggests its potential utility as an indicator for restrictive lung disease diagnosis and treatment. This is particularly important as body plethysmography directly measures only FRC, which is then used to calculate the other variables.</p><p>Focusing on the estimation of ERV, the notably high MAPE indicates a relatively subpar overall performance. Given that ERV has the narrowest range of measured values (ie, median 0.8 L, (IQR 0-44) L and a large RMSE of 0.31 relative to the ERV range, this elevated MAPE may be partially influenced by the smaller margin for error [<xref ref-type="bibr" rid="ref21">21</xref>]. ERV measures the volume of air that an individual can exhale after completing a normal tidal breath. Pairing this with spirometry, individuals with a higher ERV may experience more difficulty with exhalation or exhibit an obstructive pattern on spirometry with a lower FEV1 measure [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. A higher ERV could be a sign of lung hyperinflation, while other factors like obesity, pregnancy, and significant ascites can decrease ERV [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Lung hyperinflation in obstructed patients, which is defined as elevated FRC, RV, RV/TLC, or occasionally ERV, is highly variable in patients and occurs inconsistently over time [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. This inconsistency, combined with ERV&#x2019;s narrow range, makes it challenging to predict.</p><p>Highlighting a more robust model, predictions for the RV/TLC ratio are strong overall, with AUC values ranging from 0.8 to 0.86 across all patterns and 0.91 in the full cohort. Except for normal pattern PFTs, the model consistently achieved sensitivities &#x003E;0.84, but it struggled to identify positive cases in normal spirometry tests. While spirometry alone does not directly measure RV or TLC, FEV1 and FVC can indirectly reflect changes in lung volumes. In obstructive lung diseases, a reduction in FEV1/FVC ratio combined with an increase in the RV/TLC ratio often indicates air trapping [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]. In restrictive diseases, such as pulmonary fibrosis, spirometry may show decreased FVC with a preserved or decreased RV/TLC ratio, suggesting reduced air trapping [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]. Given the absence of abnormal FEV1 and FVC values, normal spirometry patterns would not usually suggest the existence of an abnormal RV/TLC ratio, potentially explaining the reduced sensitivity to predicting abnormal RV/TLC in normal spirometry.</p><p>A previous study used a CatBoost model to predict the TLC from spirometry, yielding good results [<xref ref-type="bibr" rid="ref7">7</xref>]. The study reports an MSE of 560.1 mL for TLC and a positive predictive value for reduced TLC of 8% or 67%, depending on the model parameters. However, this study only focused on TLC and did not assess other pulmonary physiologic parameters obtained through lung volume measurements, such as FRC and RV. These parameters are necessary as they are crucial for assessing prognosis in various respiratory diseases [<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref30">30</xref>].</p><p>Several studies have highlighted the importance of lung volume assessments for the diagnosis and prognosis of respiratory diseases [<xref ref-type="bibr" rid="ref31">31</xref>]. In routine practice, it can aid in the early detection, diagnosis, and monitoring of respiratory conditions such as COPD, restrictive lung diseases, and neuromuscular disorders affecting respiratory function [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. For instance, lung volume measurements (specifically, FRC and TLC) strongly correlate with mortality risk among patients with idiopathic pulmonary fibrosis [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. This illustrates that the prediction of lung volumes from traditional spirometry holds substantial promise in clinical scenarios where lung volume measurements cannot be directly performed, such as primary care offices, or health care facilities in rural areas where the equipment for measuring lung volumes is not readily accessible. Another scenario is when a patient is not capable of physically performing lung volume measurements, which could involve physical conditions that prevent them or any number of other limitations that could potentially limit them. Additionally, it may facilitate personalized treatment plans by providing a more nuanced understanding of a patient&#x2019;s lung capacities, as lung volume measurements are typically performed only after a patient is determined to have an abnormal spirometry, unless in specialized centers.</p><p>Accurate assessment of lung volumes is pivotal in diagnosing and monitoring various respiratory conditions, including COPD, interstitial lung diseases, neuromuscular disorders, and restrictive lung diseases [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. If lung volume measurements are not performed, vital capacity is often used as a surrogate [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. However, there is a significant error in the application of this method, as a reduced vital capacity can be seen in restrictive lung disease and obstructive lung disease with increased residual volume [<xref ref-type="bibr" rid="ref36">36</xref>]. A restrictive defect on lung volume measurements has rarely been seen occurring with normal vital capacity, and approximately 58% of the time with low vital capacity measurements [<xref ref-type="bibr" rid="ref36">36</xref>]. Another study showed that when forced vital capacity &#x003E;100% predicted in males or &#x003E;85% predicted in females ruled out a restrictive pattern on lung volumes [<xref ref-type="bibr" rid="ref37">37</xref>]. The use of direct lung volume prediction models, such as those developed in this study, have a significantly better performance than those used in these prior studies and could reduce the frequency of clinical scenarios where lung volumes are unknown.</p><p>The AI model&#x2019;s ability to estimate lung volumes from readily available spirometry data streamlines these diagnostic procedures. A typical spirometry test may take approximately 30&#x2010;45 minutes, while lung volume measurements add another 15&#x2010;30 minutes [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. Replacing or complementing traditional, more resource-intensive lung volume measurement techniques with the AI model&#x2019;s predictions from spirometry data offers cost-effective alternatives. The physician fee for spirometry ranges from $29.62 to $150.68, depending upon the medications used, while measuring lung volumes adds another $59.98 to the cost [<xref ref-type="bibr" rid="ref40">40</xref>]. This approach optimizes healthcare resources, reduces patient burden associated with additional tests, and potentially increases the efficiency of healthcare delivery.</p><p>The accessibility of spirometry in various healthcare settings, coupled with the estimation of both lung volumes via the developed models, opens avenues for telemedicine applications. Remote monitoring and assessment of spirometry are already being performed and could be facilitated and enhanced with automated decision support systems utilizing models such as those developed in this study [<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref43">43</xref>]. Such strategies could enable the continuous monitoring of patients with chronic respiratory conditions that affect lung volumes [<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref43">43</xref>]. This aligns with the evolving landscape of telemedicine, emphasizing its potential in respiratory care.</p><p>Despite the remarkable performance of the predictive models, certain limitations warrant consideration. Model training and testing relied on datasets with potential biases in demographic variables, including a majority-White population (91%) of older adults (median age 64.7) years. These factors potentially limit the generalizability to diverse populations, although this model was developed with patients of all ages from two distinct regions of the United States (Midwest and Southeast). Further validation across broader demographic groups from various clinical settings is essential to establish widespread applicability and reliability. Moreover, continuous refinement and validation of the models using larger datasets encompassing a broader spectrum of respiratory conditions and disease severities is imperative. This iterative process would enhance model performance while preventing model drift, ensuring its efficacy in diverse clinical scenarios even as standard clinical practices are updated or changed.</p><p>In conclusion, the development of AI models for predicting lung volumes from spirometry represents an advancement in pulmonary function assessment. The remarkable sensitivity and specificity offered by the classification models affect a transformative approach to complement traditional lung volume measurement techniques. While the regression models may not attain the same level of performance, the continuous nature of their estimates provides a unique addition to supplement and contextualize binary classifications, potentially elucidating new insights into the remote monitoring of pulmonary function. If integrated into clinical practice, these models hold the promise of revolutionizing respiratory care, enabling more comprehensive and accessible assessments of lung function, and ultimately improving patient outcomes. Overall, the models demonstrate robust performance across lung volume measurements, underscoring their potential utility in clinical practice for accurate diagnosis and prognosis of respiratory conditions in locations where access to body plethysmography or other lung volume measurement modalities is challenging..</p></sec></body><back><ack><p>This publication was made possible through the support of the Walter and Leonare Annenberg Career Development Award in Pulmonary Medicine (2 of 2).</p></ack><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations:</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">AUC</term><def><p>area under the receiver-operating-characteristic curve</p></def></def-item><def-item><term id="abb3">COPD</term><def><p>chronic obstructive pulmonary disease</p></def></def-item><def-item><term id="abb4">ERV</term><def><p>expiratory reserve volume</p></def></def-item><def-item><term id="abb5">FEV1</term><def><p>forced expiratory volume in the first second of exhalation</p></def></def-item><def-item><term id="abb6">FEV1/FVC</term><def><p>ratio of FEV1 and FVC</p></def></def-item><def-item><term id="abb7">FRC</term><def><p>functional residual volume</p></def></def-item><def-item><term id="abb8">FVC</term><def><p>forced vital capacity</p></def></def-item><def-item><term id="abb9">LLN</term><def><p>lower limit of normal</p></def></def-item><def-item><term id="abb10">LRT+</term><def><p>positive likelihood ratio</p></def></def-item><def-item><term id="abb11">LRT-</term><def><p>negative likelihood ratio</p></def></def-item><def-item><term id="abb12">MAE</term><def><p>mean absolute error</p></def></def-item><def-item><term id="abb13">MAPE</term><def><p>mean absolute percentage error</p></def></def-item><def-item><term id="abb14">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb15">MPE</term><def><p>mean percentage error</p></def></def-item><def-item><term id="abb16">NPV</term><def><p>negative predictive value</p></def></def-item><def-item><term id="abb17">PFT</term><def><p>pulmonary function test</p></def></def-item><def-item><term id="abb18">PPV</term><def><p>positive predictive value</p></def></def-item><def-item><term id="abb19">RMSE</term><def><p>root mean squared error</p></def></def-item><def-item><term id="abb20">RV</term><def><p>residual volume</p></def></def-item><def-item><term id="abb21">RV/TLC</term><def><p>ratio of residual volume to total lung capacity</p></def></def-item><def-item><term id="abb22">SPEC</term><def><p>specificity</p></def></def-item><def-item><term id="abb23">TLC</term><def><p>total lung capacity</p></def></def-item><def-item><term id="abb24">ULN</term><def><p>upper limit of normal</p></def></def-item><def-item><term id="abb25">VC</term><def><p>vital capacity</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hall</surname><given-names>GL</given-names> </name><name name-style="western"><surname>Filipow</surname><given-names>N</given-names> </name><name name-style="western"><surname>Ruppel</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Official ERS technical standard: Global Lung Function Initiative reference values for static lung volumes in individuals of European ancestry</article-title><source>Eur Respir J</source><year>2021</year><month>03</month><volume>57</volume><issue>3</issue><fpage>2000289</fpage><pub-id pub-id-type="doi">10.1183/13993003.00289-2020</pub-id><pub-id pub-id-type="medline">33707167</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Crapo</surname><given-names>RO</given-names> </name></person-group><article-title>Pulmonary-function testing</article-title><source>N Engl J Med</source><year>1994</year><month>07</month><day>7</day><volume>331</volume><issue>1</issue><fpage>25</fpage><lpage>30</lpage><pub-id pub-id-type="doi">10.1056/NEJM199407073310107</pub-id><pub-id pub-id-type="medline">8202099</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>O&#x2019;Donnell</surname><given-names>DE</given-names> </name><name name-style="western"><surname>Milne</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Vincent</surname><given-names>SG</given-names> </name><name name-style="western"><surname>Neder</surname><given-names>JA</given-names> </name></person-group><article-title>Unraveling the causes of unexplained dyspnea: the value of exercise testing</article-title><source>Clin Chest Med</source><year>2019</year><month>06</month><volume>40</volume><issue>2</issue><fpage>471</fpage><lpage>499</lpage><pub-id pub-id-type="doi">10.1016/j.ccm.2019.02.014</pub-id><pub-id pub-id-type="medline">31078223</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ruppel</surname><given-names>GL</given-names> </name></person-group><article-title>What is the clinical value of lung volumes?</article-title><source>Respir Care</source><year>2012</year><month>01</month><volume>57</volume><issue>1</issue><fpage>26</fpage><lpage>35</lpage><pub-id pub-id-type="doi">10.4187/respcare.01374</pub-id><pub-id pub-id-type="medline">22222123</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ip</surname><given-names>A</given-names> </name><name name-style="western"><surname>Asamoah-Barnieh</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bischak</surname><given-names>DP</given-names> </name><name name-style="western"><surname>Davidson</surname><given-names>WJ</given-names> </name><name name-style="western"><surname>Flemons</surname><given-names>WW</given-names> </name><name name-style="western"><surname>Pendharkar</surname><given-names>SR</given-names> </name></person-group><article-title>Using operational analysis to improve access to pulmonary function testing</article-title><source>Can Respir J</source><year>2016</year><volume>2016</volume><fpage>5269374</fpage><pub-id pub-id-type="doi">10.1155/2016/5269374</pub-id><pub-id pub-id-type="medline">27445545</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sassi-Dambron</surname><given-names>DE</given-names> </name><name name-style="western"><surname>Eakin</surname><given-names>EG</given-names> </name><name name-style="western"><surname>Ries</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Kaplan</surname><given-names>RM</given-names> </name></person-group><article-title>Treatment of dyspnea in COPD. A controlled clinical trial of dyspnea management strategies</article-title><source>Chest</source><year>1995</year><month>03</month><volume>107</volume><issue>3</issue><fpage>724</fpage><lpage>729</lpage><pub-id pub-id-type="doi">10.1378/chest.107.3.724</pub-id><pub-id pub-id-type="medline">7874944</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Beverin</surname><given-names>L</given-names> </name><name name-style="western"><surname>Topalovic</surname><given-names>M</given-names> </name><name name-style="western"><surname>Halilovic</surname><given-names>A</given-names> </name><name name-style="western"><surname>Desbordes</surname><given-names>P</given-names> </name><name name-style="western"><surname>Janssens</surname><given-names>W</given-names> </name><name name-style="western"><surname>De Vos</surname><given-names>M</given-names> </name></person-group><article-title>Predicting total lung capacity from spirometry: a machine learning approach</article-title><source>Front Med (Lausanne)</source><year>2023</year><volume>10</volume><fpage>1174631</fpage><pub-id pub-id-type="doi">10.3389/fmed.2023.1174631</pub-id><pub-id pub-id-type="medline">37275373</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hedenstierna</surname><given-names>G</given-names> </name><name name-style="western"><surname>Rothen</surname><given-names>HU</given-names> </name></person-group><article-title>Atelectasis formation during anesthesia: causes and measures to prevent it</article-title><source>J Clin Monit Comput</source><year>2000</year><volume>16</volume><issue>5-6</issue><fpage>329</fpage><lpage>335</lpage><pub-id pub-id-type="doi">10.1023/a:1011491231934</pub-id><pub-id pub-id-type="medline">12580216</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Evankovich</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Nouraie</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Sciurba</surname><given-names>FC</given-names> </name></person-group><article-title>A model to predict residual volume from forced spirometry measurements in chronic obstructive pulmonary disease</article-title><source>Chronic Obstr Pulm Dis</source><year>2023</year><month>01</month><day>25</day><volume>10</volume><issue>1</issue><fpage>55</fpage><lpage>63</lpage><pub-id pub-id-type="doi">10.15326/jcopdf.2022.0354</pub-id><pub-id pub-id-type="medline">36563054</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stanojevic</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kaminsky</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Miller</surname><given-names>MR</given-names> </name><etal/></person-group><article-title>ERS/ATS technical standard on interpretive strategies for routine lung function tests</article-title><source>Eur Respir J</source><year>2022</year><month>07</month><volume>60</volume><issue>1</issue><fpage>2101499</fpage><pub-id pub-id-type="doi">10.1183/13993003.01499-2021</pub-id><pub-id pub-id-type="medline">34949706</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Quanjer</surname><given-names>PH</given-names> </name><name name-style="western"><surname>Stanojevic</surname><given-names>S</given-names> </name><name name-style="western"><surname>Cole</surname><given-names>TJ</given-names> </name><etal/></person-group><article-title>Multi-ethnic reference values for spirometry for the 3-95-yr age range: the global lung function 2012 equations</article-title><source>Eur Respir J</source><year>2012</year><month>12</month><volume>40</volume><issue>6</issue><fpage>1324</fpage><lpage>1343</lpage><pub-id pub-id-type="doi">10.1183/09031936.00080312</pub-id><pub-id pub-id-type="medline">22743675</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stanojevic</surname><given-names>S</given-names> </name><name name-style="western"><surname>Graham</surname><given-names>BL</given-names> </name><name name-style="western"><surname>Cooper</surname><given-names>BG</given-names> </name><etal/></person-group><article-title>Official ERS technical standards: Global Lung Function Initiative reference values for the carbon monoxide transfer factor for Caucasians</article-title><source>Eur Respir J</source><year>2017</year><month>09</month><volume>50</volume><issue>3</issue><fpage>1700010</fpage><pub-id pub-id-type="doi">10.1183/13993003.00010-2017</pub-id><pub-id pub-id-type="medline">28893868</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Guestrin</surname><given-names>C</given-names> </name></person-group><article-title>XGBoost: A scalable tree boosting system</article-title><conf-name>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name><conf-date>Aug 13-17, 2016</conf-date><conf-loc>San Francisco California USA</conf-loc><fpage>785</fpage><lpage>794</lpage></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Kuhn</surname><given-names>MVD</given-names> </name><name name-style="western"><surname>Hvitfeldt</surname><given-names>E</given-names> </name></person-group><article-title>Yardstick: tidy characterizations of model performance. R package version 1.3.1 2024</article-title><access-date>2025-03-12</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://yardstick.tidymodels.org">https://yardstick.tidymodels.org</ext-link></comment></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>LeDell</surname><given-names>E</given-names> </name><name name-style="western"><surname>Poirier</surname><given-names>S</given-names> </name></person-group><article-title>H2O automl: scalable automatic machine learning</article-title><year>2020</year><month>07</month><day>18</day><access-date>2025-03-12</access-date><conf-name>Proceedings of the AutoML Workshop at ICML</conf-name><comment><ext-link ext-link-type="uri" xlink:href="https://api.semanticscholar.org/CorpusID:221338558">https://api.semanticscholar.org/CorpusID:221338558</ext-link></comment></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Budhwar</surname><given-names>N</given-names> </name><name name-style="western"><surname>Syed</surname><given-names>Z</given-names> </name></person-group><article-title>Chronic dyspnea: diagnosis and evaluation</article-title><source>Am Fam Physician</source><year>2020</year><month>05</month><day>1</day><volume>101</volume><issue>9</issue><fpage>542</fpage><lpage>548</lpage><pub-id pub-id-type="medline">32352727</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Casanova</surname><given-names>C</given-names> </name><name name-style="western"><surname>Cote</surname><given-names>C</given-names> </name><name name-style="western"><surname>de Torres</surname><given-names>JP</given-names> </name><etal/></person-group><article-title>Inspiratory-to-total lung capacity ratio predicts mortality in patients with chronic obstructive pulmonary disease</article-title><source>Am J Respir Crit Care Med</source><year>2005</year><month>03</month><day>15</day><volume>171</volume><issue>6</issue><fpage>591</fpage><lpage>597</lpage><pub-id pub-id-type="doi">10.1164/rccm.200407-867OC</pub-id><pub-id pub-id-type="medline">15591470</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marin</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Carrizo</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Gascon</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sanchez</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gallego</surname><given-names>B</given-names> </name><name name-style="western"><surname>Celli</surname><given-names>BR</given-names> </name></person-group><article-title>Inspiratory capacity, dynamic hyperinflation, breathlessness, and exercise performance during the 6-minute-walk test in chronic obstructive pulmonary disease</article-title><source>Am J Respir Crit Care Med</source><year>2001</year><month>05</month><volume>163</volume><issue>6</issue><fpage>1395</fpage><lpage>1399</lpage><pub-id pub-id-type="doi">10.1164/ajrccm.163.6.2003172</pub-id><pub-id pub-id-type="medline">11371407</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>O&#x2019;Donnell</surname><given-names>DE</given-names> </name><name name-style="western"><surname>Webb</surname><given-names>KA</given-names> </name></person-group><article-title>Exertional breathlessness in patients with chronic airflow limitation. The role of lung hyperinflation</article-title><source>Am Rev Respir Dis</source><year>1993</year><month>11</month><volume>148</volume><issue>5</issue><fpage>1351</fpage><lpage>1357</lpage><pub-id pub-id-type="doi">10.1164/ajrccm/148.5.1351</pub-id><pub-id pub-id-type="medline">8239175</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shin</surname><given-names>TR</given-names> </name><name name-style="western"><surname>Oh</surname><given-names>YM</given-names> </name><name name-style="western"><surname>Park</surname><given-names>JH</given-names> </name><etal/></person-group><article-title>The prognostic value of residual volume/total lung capacity in patients with chronic obstructive pulmonary disease</article-title><source>J Korean Med Sci</source><year>2015</year><month>10</month><volume>30</volume><issue>10</issue><fpage>1459</fpage><lpage>1465</lpage><pub-id pub-id-type="doi">10.3346/jkms.2015.30.10.1459</pub-id><pub-id pub-id-type="medline">26425043</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Makridakis</surname><given-names>S</given-names> </name></person-group><article-title>Accuracy measures: theoretical and practical concerns</article-title><source>Int J Forecast</source><year>1993</year><month>12</month><volume>9</volume><issue>4</issue><fpage>527</fpage><lpage>529</lpage><pub-id pub-id-type="doi">10.1016/0169-2070(93)90079-3</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Quanjer</surname><given-names>PH</given-names> </name><name name-style="western"><surname>Tammeling</surname><given-names>GJ</given-names> </name><name name-style="western"><surname>Cotes</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Pedersen</surname><given-names>OF</given-names> </name><name name-style="western"><surname>Peslin</surname><given-names>R</given-names> </name><name name-style="western"><surname>Yernault</surname><given-names>JC</given-names> </name></person-group><article-title>Lung volumes and forced ventilatory flows</article-title><source>Eur Respir J</source><year>1993</year><month>03</month><day>1</day><volume>6</volume><issue>Suppl 16</issue><fpage>5</fpage><lpage>40</lpage><pub-id pub-id-type="doi">10.1183/09041950.005s1693</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Papandrinopoulou</surname><given-names>D</given-names> </name><name name-style="western"><surname>Tzouda</surname><given-names>V</given-names> </name><name name-style="western"><surname>Tsoukalas</surname><given-names>G</given-names> </name></person-group><article-title>Lung compliance and chronic obstructive pulmonary disease</article-title><source>Pulm Med</source><year>2012</year><volume>2012</volume><fpage>542769</fpage><pub-id pub-id-type="doi">10.1155/2012/542769</pub-id><pub-id pub-id-type="medline">23150821</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>O&#x2019;Donnell</surname><given-names>DE</given-names> </name><name name-style="western"><surname>Laveneziana</surname><given-names>P</given-names> </name></person-group><article-title>Physiology and consequences of lung hyperinflation in COPD</article-title><source>Eur Respir Rev</source><year>2006</year><month>12</month><volume>15</volume><issue>100</issue><fpage>61</fpage><lpage>67</lpage><pub-id pub-id-type="doi">10.1183/09059180.00010002</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Leith</surname><given-names>DE</given-names> </name><name name-style="western"><surname>Brown</surname><given-names>R</given-names> </name></person-group><article-title>Human lung volumes and the mechanisms that set them</article-title><source>Eur Respir J</source><year>1999</year><month>02</month><volume>13</volume><issue>2</issue><fpage>468</fpage><lpage>472</lpage><pub-id pub-id-type="doi">10.1183/09031936.99.13246899</pub-id><pub-id pub-id-type="medline">10065702</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Budweiser</surname><given-names>S</given-names> </name><name name-style="western"><surname>Harlacher</surname><given-names>M</given-names> </name><name name-style="western"><surname>Pfeifer</surname><given-names>M</given-names> </name><name name-style="western"><surname>J&#x00F6;rres</surname><given-names>RA</given-names> </name></person-group><article-title>Co-morbidities and hyperinflation are independent risk factors of all-cause mortality in very severe COPD</article-title><source>COPD</source><year>2014</year><month>08</month><volume>11</volume><issue>4</issue><fpage>388</fpage><lpage>400</lpage><pub-id pub-id-type="doi">10.3109/15412555.2013.836174</pub-id><pub-id pub-id-type="medline">24111878</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Erbes</surname><given-names>R</given-names> </name><name name-style="western"><surname>Schaberg</surname><given-names>T</given-names> </name><name name-style="western"><surname>Loddenkemper</surname><given-names>R</given-names> </name></person-group><article-title>Lung function tests in patients with idiopathic pulmonary fibrosis. Are they helpful for predicting outcome?</article-title><source>Chest</source><year>1997</year><month>01</month><volume>111</volume><issue>1</issue><fpage>51</fpage><lpage>57</lpage><pub-id pub-id-type="doi">10.1378/chest.111.1.51</pub-id><pub-id pub-id-type="medline">8995992</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kishaba</surname><given-names>T</given-names> </name><name name-style="western"><surname>Maeda</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yamazato</surname><given-names>S</given-names> </name><name name-style="western"><surname>Nabeya</surname><given-names>D</given-names> </name><name name-style="western"><surname>Yamashiro</surname><given-names>S</given-names> </name><name name-style="western"><surname>Nagano</surname><given-names>H</given-names> </name></person-group><article-title>Radiological and physiological predictors of IPF mortality</article-title><source>Medicina (Kaunas)</source><year>2021</year><month>10</month><day>18</day><volume>57</volume><issue>10</issue><fpage>1121</fpage><pub-id pub-id-type="doi">10.3390/medicina57101121</pub-id><pub-id pub-id-type="medline">34684158</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nishimura</surname><given-names>K</given-names> </name><name name-style="western"><surname>Izumi</surname><given-names>T</given-names> </name><name name-style="western"><surname>Tsukino</surname><given-names>M</given-names> </name><name name-style="western"><surname>Oga</surname><given-names>T</given-names> </name></person-group><article-title>Dyspnea is a better predictor of 5-year survival than airway obstruction in patients with COPD</article-title><source>Chest</source><year>2002</year><month>05</month><volume>121</volume><issue>5</issue><fpage>1434</fpage><lpage>1440</lpage><pub-id pub-id-type="doi">10.1378/chest.121.5.1434</pub-id><pub-id pub-id-type="medline">12006425</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>King</surname><given-names>TE</given-names> </name><name name-style="western"><surname>Tooze</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Schwarz</surname><given-names>MI</given-names> </name><name name-style="western"><surname>Brown</surname><given-names>KR</given-names> </name><name name-style="western"><surname>Cherniack</surname><given-names>RM</given-names> </name></person-group><article-title>Predicting survival in idiopathic pulmonary fibrosis</article-title><source>Am J Respir Crit Care Med</source><year>2001</year><month>10</month><day>1</day><volume>164</volume><issue>7</issue><fpage>1171</fpage><lpage>1181</lpage><pub-id pub-id-type="doi">10.1164/ajrccm.164.7.2003140</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lutfi</surname><given-names>MF</given-names> </name></person-group><article-title>The physiological basis and clinical significance of lung volume measurements</article-title><source>Multidiscip Respir Med</source><year>2017</year><volume>12</volume><fpage>3</fpage><pub-id pub-id-type="doi">10.1186/s40248-017-0084-5</pub-id><pub-id pub-id-type="medline">28194273</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Agust&#x00ED;</surname><given-names>A</given-names> </name><name name-style="western"><surname>Celli</surname><given-names>BR</given-names> </name><name name-style="western"><surname>Criner</surname><given-names>GJ</given-names> </name><etal/></person-group><article-title>Global initiative for chronic obstructive lung disease 2023 report: GOLD executive summary</article-title><source>Eur Respir J</source><year>2023</year><month>04</month><volume>61</volume><issue>4</issue><fpage>2300239</fpage><pub-id pub-id-type="doi">10.1183/13993003.00239-2023</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chiang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Mehta</surname><given-names>K</given-names> </name><name name-style="western"><surname>Amin</surname><given-names>R</given-names> </name></person-group><article-title>Respiratory diagnostic tools in neuromuscular disease</article-title><source>Children (Basel)</source><year>2018</year><month>06</month><day>15</day><volume>5</volume><issue>6</issue><fpage>78</fpage><pub-id pub-id-type="doi">10.3390/children5060078</pub-id><pub-id pub-id-type="medline">29914128</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mehrparvar</surname><given-names>AH</given-names> </name><name name-style="western"><surname>Sakhvidi</surname><given-names>MJZ</given-names> </name><name name-style="western"><surname>Mostaghaci</surname><given-names>M</given-names> </name><name name-style="western"><surname>Davari</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Hashemi</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Zare</surname><given-names>Z</given-names> </name></person-group><article-title>Spirometry values for detecting a restrictive pattern in occupational health settings</article-title><source>Tanaffos</source><year>2014</year><volume>13</volume><issue>2</issue><fpage>27</fpage><lpage>34</lpage><pub-id pub-id-type="medline">25506373</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pellegrino</surname><given-names>R</given-names> </name><name name-style="western"><surname>Viegi</surname><given-names>G</given-names> </name><name name-style="western"><surname>Brusasco</surname><given-names>V</given-names> </name><etal/></person-group><article-title>Interpretative strategies for lung function tests</article-title><source>Eur Respir J</source><year>2005</year><month>11</month><volume>26</volume><issue>5</issue><fpage>948</fpage><lpage>968</lpage><pub-id pub-id-type="doi">10.1183/09031936.05.00035205</pub-id><pub-id pub-id-type="medline">16264058</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dykstra</surname><given-names>BJ</given-names> </name><name name-style="western"><surname>Scanlon</surname><given-names>PD</given-names> </name><name name-style="western"><surname>Kester</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Beck</surname><given-names>KC</given-names> </name><name name-style="western"><surname>Enright</surname><given-names>PL</given-names> </name></person-group><article-title>Lung volumes in 4,774 patients with obstructive lung disease</article-title><source>Chest</source><year>1999</year><month>01</month><volume>115</volume><issue>1</issue><fpage>68</fpage><lpage>74</lpage><pub-id pub-id-type="doi">10.1378/chest.115.1.68</pub-id><pub-id pub-id-type="medline">9925064</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vandevoorde</surname><given-names>J</given-names> </name><name name-style="western"><surname>Verbanck</surname><given-names>S</given-names> </name><name name-style="western"><surname>Schuermans</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Forced vital capacity and forced expiratory volume in six seconds as predictors of reduced total lung capacity</article-title><source>Eur Respir J</source><year>2008</year><month>02</month><volume>31</volume><issue>2</issue><fpage>391</fpage><lpage>395</lpage><pub-id pub-id-type="doi">10.1183/09031936.00032307</pub-id><pub-id pub-id-type="medline">17928313</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="web"><article-title>What is spirometry and why it is done</article-title><source>American Lung Association</source><year>2023</year><access-date>2024-07-20</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.lung.org/lung-health-diseases/lung-procedures-and-tests/spirometry">https://www.lung.org/lung-health-diseases/lung-procedures-and-tests/spirometry</ext-link></comment></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="web"><article-title>Pulmonary function tests</article-title><source>National Heart Lung, and Blood Institute</source><access-date>2024-07-20</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.nhlbi.nih.gov/science/pulmonary-function-lab/tests">https://www.nhlbi.nih.gov/science/pulmonary-function-lab/tests</ext-link></comment></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="web"><article-title>Physician fee schedule</article-title><source>Centers for Medicare and Medicaid Services</source><year>2024</year><access-date>2024-08-05</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.cms.gov/medicare/payment/fee-schedules/physician?redirect=/PhysicianFeeSched">https://www.cms.gov/medicare/payment/fee-schedules/physician?redirect=/PhysicianFeeSched</ext-link></comment></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Burgos</surname><given-names>F</given-names> </name><name name-style="western"><surname>Disdier</surname><given-names>C</given-names> </name><name name-style="western"><surname>de Santamaria</surname><given-names>EL</given-names> </name><etal/></person-group><article-title>Telemedicine enhances quality of forced spirometry in primary care</article-title><source>Eur Respir J</source><year>2012</year><month>06</month><volume>39</volume><issue>6</issue><fpage>1313</fpage><lpage>1318</lpage><pub-id pub-id-type="doi">10.1183/09031936.00168010</pub-id><pub-id pub-id-type="medline">22075488</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Congrete</surname><given-names>S</given-names> </name><name name-style="western"><surname>Metersky</surname><given-names>ML</given-names> </name></person-group><article-title>Telemedicine and remote monitoring as an adjunct to medical management of bronchiectasis</article-title><source>Life (Basel)</source><year>2021</year><month>11</month><day>6</day><volume>11</volume><issue>11</issue><fpage>1196</fpage><pub-id pub-id-type="doi">10.3390/life11111196</pub-id><pub-id pub-id-type="medline">34833072</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liao</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Young</surname><given-names>TH</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>CT</given-names> </name><etal/></person-group><article-title>The feasibility and efficiency of remote spirometry system on the pulmonary function for multiple ribs fracture patients</article-title><source>J Pers Med</source><year>2021</year><month>10</month><day>23</day><volume>11</volume><issue>11</issue><fpage>1067</fpage><pub-id pub-id-type="doi">10.3390/jpm11111067</pub-id><pub-id pub-id-type="medline">34834419</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Classification model parameters.</p><media xlink:href="ai_v4i1e65456_app1.docx" xlink:title="DOCX File, 18 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Regression model parameters.</p><media xlink:href="ai_v4i1e65456_app2.docx" xlink:title="DOCX File, 18 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Regression model cohort summary.</p><media xlink:href="ai_v4i1e65456_app3.docx" xlink:title="DOCX File, 21 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Classification model cohort summary.</p><media xlink:href="ai_v4i1e65456_app4.docx" xlink:title="DOCX File, 19 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Classification model cohort summary by American Thoracic Society patterns.</p><media xlink:href="ai_v4i1e65456_app5.docx" xlink:title="DOCX File, 22 KB"/></supplementary-material><supplementary-material id="app6"><label>Multimedia Appendix 6</label><p>Regression model performance metrics.</p><media xlink:href="ai_v4i1e65456_app6.docx" xlink:title="DOCX File, 36 KB"/></supplementary-material><supplementary-material id="app7"><label>Multimedia Appendix 7</label><p>Classification model performance metrics.</p><media xlink:href="ai_v4i1e65456_app7.docx" xlink:title="DOCX File, 27 KB"/></supplementary-material></app-group></back></article>