<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR AI</journal-id><journal-id journal-id-type="publisher-id">ai</journal-id><journal-id journal-id-type="index">41</journal-id><journal-title>JMIR AI</journal-title><abbrev-journal-title>JMIR AI</abbrev-journal-title><issn pub-type="epub">2817-1705</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v4i1e73448</article-id><article-id pub-id-type="doi">10.2196/73448</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Leveraging Large Language Models and Machine Learning for Success Analysis in Robust Cancer Crowdfunding Predictions: Quantitative Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Bhaumik</surname><given-names>Runa</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Roy</surname><given-names>Abhishikta</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Srivastava</surname><given-names>Vineet</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Boggavarapu</surname><given-names>Lokesh</given-names></name><degrees>BSc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chandrasekaran</surname><given-names>Ranganathan</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mensah</surname><given-names>Edward K</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Galvin</surname><given-names>John</given-names></name><degrees>MD, MHA, MS</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Psychiatry, College of Medicine, University of Illinois Chicago</institution><addr-line>1601 West Taylor Street</addr-line><addr-line>Chicago</addr-line><addr-line>IL</addr-line><country>United States</country></aff><aff id="aff2"><institution>Department of Information and Decision Sciences, University of Illinois Chicago</institution><addr-line>Chicago</addr-line><addr-line>IL</addr-line><country>United States</country></aff><aff id="aff3"><institution>Health Policy and Administration, School of Public Health, University of Illinois Chicago</institution><addr-line>Chicago</addr-line><addr-line>IL</addr-line><country>United States</country></aff><aff id="aff4"><institution>Division of Hematology and Oncology, Department of Medicine, College of Medicine, University of Illinois Chicago</institution><addr-line>Chicago</addr-line><addr-line>IL</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Yin</surname><given-names>Zhijun</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Khosla</surname><given-names>Archit</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Khasnavis</surname><given-names>Nithisha</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Matsuda</surname><given-names>Shinichi</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Runa Bhaumik, PhD, Department of Psychiatry, College of Medicine, University of Illinois Chicago, 1601 West Taylor Street, Chicago, IL, 60612, United States, 1 7085672467; <email>rbhaumik@uic.edu</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>19</day><month>11</month><year>2025</year></pub-date><volume>4</volume><elocation-id>e73448</elocation-id><history><date date-type="received"><day>04</day><month>03</month><year>2025</year></date><date date-type="rev-recd"><day>31</day><month>07</month><year>2025</year></date><date date-type="accepted"><day>13</day><month>10</month><year>2025</year></date></history><copyright-statement>&#x00A9; Runa Bhaumik, Abhishikta Roy, Vineet Srivastava, Lokesh Boggavarapu, Ranganathan Chandrasekaran, Edward K Mensah, John Galvin. Originally published in JMIR AI (<ext-link ext-link-type="uri" xlink:href="https://ai.jmir.org">https://ai.jmir.org</ext-link>), 19.11.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.ai.jmir.org/">https://www.ai.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://ai.jmir.org/2025/1/e73448"/><abstract><sec><title>Background</title><p>Recent advances in large language models (LLMs) such as GPT-4o offer a transformative opportunity to extract nuanced linguistic, emotional, and social features from medical crowdfunding campaign texts at scale. These models enable a deeper understanding of the factors influencing campaign success far beyond what structured data alone can reveal. Given these advancements, there is a pressing need for an integrated modeling framework that leverages both LLM-derived features and machine learning algorithms to more accurately predict and explain success in medical crowdfunding.</p></sec><sec><title>Objective</title><p>This study addressed the gap of failure to capture the deeper psychosocial and clinical nuances that influence campaign success. It leveraged cutting-edge machine learning techniques alongside state-of-the-art LLMs such as GPT-4o to automatically generate and extract nuanced linguistic, social, and clinical features from campaign narratives. By combining these features with ensemble learning approaches, the proposed methodology offers a novel and more comprehensive strategy for understanding and predicting crowdfunding success in the medical domain.</p></sec><sec sec-type="methods"><title>Methods</title><p>We used GPT-4o to extract linguistic and social determinants of health features from cancer crowdfunding campaign narratives. A random forest model with permutation importance was applied to rank features based on their contribution to predicting campaign success. Four machine learning algorithms&#x2014;random forest, gradient boosting, logistic regression, and elastic net&#x2014;were evaluated using stratified 10-fold cross-validation, with performance measured through accuracy, sensitivity, and specificity.</p></sec><sec sec-type="results"><title>Results</title><p>Gradient boosting consistently outperformed the other algorithms in terms of sensitivity (consistently 0.786 to 0.798), indicating its superior ability to identify successful crowdfunding campaigns using linguistic and social determinants of health features. The permutation importance score revealed that for severe medical conditions, income loss, chemotherapy treatment, clear and effective communication, cognitive understanding, family involvement, empathy, and social behaviors play an important role in the success of campaigns.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study demonstrates that LLMs such as GPT-4o can effectively extract nuanced linguistic and social features from crowdfunding narratives, offering deeper insights than traditional methods. These features, when combined with machine learning, significantly improve the identification of key predictors of campaign success, such as medical severity, financial hardship, and empathetic communication. Our findings underscore the potential of LLMs to enhance predictive modeling in health-related crowdfunding and support more targeted policy and communication strategies to reduce financial vulnerability among patients with cancer.</p></sec></abstract><kwd-group><kwd>cancer crowdfunding</kwd><kwd>machine learning</kwd><kwd>large language models</kwd><kwd>linguistic features</kwd><kwd>social determinants of health</kwd><kwd>health policy</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>The cost of cancer care in the United States is increasing rapidly due to various factors, including technological advancements, expensive cutting-edge therapies, and improved access to treatment. Patients with cancer and their families often face substantial financial consequences, such as borrowing money, spending less on food, going into debt, or declaring bankruptcy [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. These issues are exacerbated by a lack of medical insurance or lack of coverage due to health care regulations such as the Affordable Care Act. As a result, patients and caregivers seek help from other sources to raise funds for medical care [<xref ref-type="bibr" rid="ref2">2</xref>].</p><p>Crowdfunding has become a significant tool for raising money through social media and web-based platforms such as Indiegogo, Kickstarter, and GoFundMe, generating US $34.4 billion in 2015 alone [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. Medical crowdfunding constitutes a significant portion of these campaigns in the United States due to gaps in insurance coverage and the prohibitive costs of medical treatments, such as in cancer care, even for those with insurance [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Success factors for these campaigns include demographic attributes, racial background, campaign images, textual features, and social media characteristics, with campaigns for children attracting more donations than those for adults [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. In cancer treatment crowdfunding, 65.4% of campaigns involve advanced-stage patients, with detailed information about cancer types, treatments, and costs leading to higher fundraising success [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref15">15</xref>]. In addition, research has characterized the use of crowdfunding to support oncology care needs, examining associations between insurance status and other characteristics related to unmet financial obligations [<xref ref-type="bibr" rid="ref13">13</xref>].</p><p>The field of crowdfunding prediction has primarily relied on traditional statistical methods such as linear and logistic regression in previous studies. These methods assume that the input variables are independent from each other. However, when there are correlations among the input variables, using regression methods can lead to larger prediction errors. To overcome this limitation, researchers have turned to machine learning (ML) techniques. ML algorithms have proven to be effective in analyzing hidden associations within large datasets and identifying complex patterns [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. As a result, researchers have used ML algorithms to predict the success of crowdfunding campaigns [<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref20">20</xref>]. This shift in methodology allows for better prediction accuracy and the discovery of more nuanced relationships among the input variables. For instance, ML algorithms such as support vector machine, decision tree, and k-nearest neighbor have been used to predict the success of projects [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. In addition, algorithms such as extreme gradient boosting, gradient boosting, random forest, and generalized linear models have been used to construct prediction models [<xref ref-type="bibr" rid="ref25">25</xref>].</p><p>Previous crowdfunding research has demonstrated that ML methods can effectively model complex relationships between variables, capture interactions, and yield more accurate and insightful predictions. However, there has been a lack of thorough analysis regarding the selection of predictors and campaign success measures. Furthermore, the application of large language models (LLMs) in the crowdfunding domain remains relatively unexplored. The only study in this domain to date [<xref ref-type="bibr" rid="ref26">26</xref>] has generated insights on medical financial hardship patterns and unmet social needs by leveraging generative artificial intelligence on GoFundMe cancer crowdfunding campaigns using logistic regression.</p><p>In this study, we explored the use of LLMs and ML models to generate and identify predictors of successful campaigns. LLMs are particularly helpful in capturing the semantic meaning of words and phrases in internet-based texts by using word embeddings and contextual embeddings, which were trained on large, diverse texts. GPT-4o [<xref ref-type="bibr" rid="ref27">27</xref>], developed by OpenAI, is an LLM known for its conversational text generation capabilities. We used GPT-4o and prompted relevant campaign information to extract and analyze linguistic and social determinants of health (SDOH) factors. We also provided a robust feature selection based on the permutation technique for a better understanding of the model.</p><p>Our research had three primary objectives: (1) to leverage LLMs, specifically GPT-4o, to automatically generate a wide range of linguistic, social, and clinical features from crowdfunding campaign narratives; (2) to implement a robust feature selection strategy using the random forest algorithm combined with permutation importance to quantify and interpret the relative contribution of each feature to predictive performance without implying causal relationships; and (3) to conduct a comprehensive evaluation of predictive performance across multiple ML algorithms using the key features identified through the random forest&#x2013;based feature selection approach.</p><p>To the best of our knowledge, this study is the first to leverage an LLM for feature extraction and an ML algorithm to establish an effective prediction model for GoFundMe cancer crowdfunding campaigns with a robust feature selection method. By integrating innovative ML algorithms and feature selection strategies into crowdfunding research, we not only advance the academic understanding of this domain but also provide actionable insights that can be directly applied by policymakers and campaign organizers. These advancements are essential for addressing the growing reliance on crowdfunding in the health care sector and ensuring that support reaches those who need it the most.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethical Considerations</title><p>All data used in this study were obtained from publicly accessible crowdfunding campaigns on the GoFundMe platform via its public API. The API provides campaign metadata (eg, title, goal amount, amount raised, description text, and campaign category) that are already visible to any online user without registration. No private, donor-level, or personally identifiable information (PII) was accessed, and no authentication was required. The research complied with GoFundMe&#x2019;s published Terms of Service [<xref ref-type="bibr" rid="ref28">28</xref>] at the time of data collection. Because this study only used publicly accessible data, institutional review was not required, as per local guidelines [<xref ref-type="bibr" rid="ref29">29</xref>].</p></sec><sec id="s2-2"><title>Data Collection</title><p>The data for this study were collected from the GoFundMe crowdfunding platform, which is the world&#x2019;s largest platform in terms of both the total amount of funding raised and the total number of active campaigns. Founded in 2010, GoFundMe features campaigns for various categories, including medical, memorials, emergencies, and charitable causes. The data for this analysis were extracted using a combination of application programming interface (API) access and web scraping techniques. GoFundMe stores its data in Algolia, a search and analytics engine. We obtained the necessary API key, secret key, and index name by inspecting the network tab on the GoFundMe website. We connected to the Algolia API using a Python (Python Software Foundation) program and retrieved the data. The API provided access to all records stored in the specified index, which we then processed and stored for further analysis. The data consist of 4990 campaigns for patients&#x2019; oncologic treatment and personal and financial lives that began between January 3, 2023, and December 31, 2023, with funding targets between US $800 and US $100,000.</p></sec><sec id="s2-3"><title>Campaign Success Measure</title><p>We considered a campaign to be successful if it raised a significant percentage of the goal amount. The success ratio was defined as the ratio of funds raised to the campaign goal and was converted to a binary variable at different success thresholds. In this experiment, we selected the success threshold as a ratio of 0.7 based on the observations in exploratory analysis.</p></sec><sec id="s2-4"><title>Predictors of Campaign Success</title><sec id="s2-4-1"><title>Crawled Variables</title><p>We collected key campaign data, including launch date, title, description, current raised amount, target goal, number of donors, and campaign duration. These details provide insights into each campaign&#x2019;s progress and engagement.</p></sec><sec id="s2-4-2"><title>SDOH and Medical-Related Variables</title><p>The selected variables were obtained from the Linguistic Inquiry and Word Count (Pennebaker Conglomerates, Inc) internal dictionary [<xref ref-type="bibr" rid="ref30">30</xref>] and the Centers for Disease Control and Prevention indicators [<xref ref-type="bibr" rid="ref31">31</xref>]. In addition, we incorporated several new variables related to medical procedures and treatment factors to enhance the dataset. A full categorization of these variables is provided in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Categorization of the extracted features used for crowdfunding campaign analysis.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Category</td><td align="left" valign="bottom">Factors</td></tr></thead><tbody><tr><td align="left" valign="top">Cognitive and psychological</td><td align="left" valign="top">Analytic thinking, cognition, tone, risk, reward, empathy, politeness, and authenticity</td></tr><tr><td align="left" valign="top">Linguistic and communication</td><td align="left" valign="top">Clout, linguistic content, communication, present tense, past tense, and future tense</td></tr><tr><td align="left" valign="top">Medical and health</td><td align="left" valign="top">Cancer site, stage or grade of cancer, type of therapy, treatment status, treatment duration, engagement in health care activities, comorbidities, association with health care organizations and facilities (hospices, hospitals, nursing homes, skilled nursing facilities, and emergency rooms)</td></tr><tr><td align="left" valign="top">Emotional states</td><td align="left" valign="top">Stress, anxiety, mental or behavioral dysfunctions, chronic diseases, cognitive content of communications, expression of social concerns, informal language (swear words and online abbreviations), sentiment (positive, negative, or neutral), and trust in medical care facilities</td></tr><tr><td align="left" valign="top">Employment and education</td><td align="left" valign="top">Employment status, work disruption (for individuals aged &#x2265;18 years), school absenteeism, work absenteeism, and parents&#x2019; work disruption (for beneficiaries aged &#x003C;18 years)</td></tr><tr><td align="left" valign="top">Financial and medical support</td><td align="left" valign="top">Lack of sick leave, lack of medical attention, income loss, family income loss, struggles with medical expenses, housing expenses, food expenses, and transportation expenses</td></tr><tr><td align="left" valign="top">Medical procedures and treatments</td><td align="left" valign="top">Laboratory procedures, diagnostic procedures, cancer-specific treatments (chemotherapy and radiotherapy), preventive procedures, alternative physical therapy, occupational therapy, and mental health or substance abuse therapy</td></tr><tr><td align="left" valign="top">Organizations and facilities</td><td align="left" valign="top">Association with health care&#x2013;related organizations, professional societies, self-help organizations, relief organizations, and receiving care in specific facilities (hospices, hospitals, nursing homes, skilled nursing facilities, emergency rooms, or mental health or substance abuse facilities)</td></tr><tr><td align="left" valign="top">Mental state, sentiment, or trust</td><td align="left" valign="top">Presence of stress, anxiety, mental or behavioral dysfunctions, or chronic diseases; sentiment (positive, negative, or neutral); and level of trust in medical care facilities</td></tr></tbody></table></table-wrap></sec></sec><sec id="s2-5"><title>Experimental Setup</title><sec id="s2-5-1"><title>Feature Extraction and Selection Methodology</title><p>The variables were programmatically generated using GPT-4o, a state-of-the-art LLM from OpenAI, through a structured prompting pipeline designed to extract nuanced semantic, emotional, and contextual signals and other factors from campaign narratives. We used a zero-shot prompting strategy tailored to identify all the variables. For example, the following was a representative prompt used: &#x201C;Analyze the following crowdfunding campaign description and return the sadness (0 -low and 1 -high) score or whether patient struggles with expenses for medical treatments (yes or no),).&#x201D;</p><p>We manually evaluated GPT-4o&#x2013;based feature outputs for a random sample of 50 crowdfunding campaigns to assess consistency and accuracy. Each campaign was processed using the GPT-4o API with temperature set to 0.5, maximum tokens limited to 256, and top_p (probabilistic decoding parameter) set to 1.0 to ensure stable and contextually appropriate responses. Manual review involved comparing GPT-4o&#x2013;extracted linguistic and SDOH features against human-annotated references. The observed validation error ranged from 0.06 to 0.08, indicating high reliability and supporting the use of GPT-4o for automated feature generation in this study.</p><p>Postprocessing routines were developed to convert the generated responses into structured binary or ordinal variables, which were then added to the campaign-level dataset. These extracted features were then categorized, standardized, and incorporated into downstream statistical and ML models to quantify their relative importance. Importantly, we separately evaluated the contributions of linguistic and SDOH feature sets using permutation-based feature importance within an ensemble random forest classifier, ensuring that observed effects were interpreted as associations within predictive contexts and not causal mechanisms.</p><p>We applied minimum-maximum normalization to variables with large value ranges (target amount, raised amount, number of donors, and campaign duration) to minimize their impact on prediction results. GPT-4o was used to standardize measures of linguistics and campaign predictors between 0 and 1. The predictors for social and demographic identity, as well as medical-related predictors, were extracted as a binary (yes or no) and dummy coded.</p></sec><sec id="s2-5-2"><title>ML Algorithms</title><p>We conducted 2 comparative ML experiments to evaluate the predictive utility of different feature sets in determining the success of cancer-related crowdfunding campaigns. In both experiments, the dataset was divided into training (70%) and testing (30%) subsets, and all models were validated using 10-fold stratified cross-validation on the training data to ensure robustness and minimize overfitting.</p><p>In the first experiment, we focused on linguistic and campaign-level features. Linguistic features&#x2014;such as tone, empathy, clout, and sentiment&#x2014;were extracted using GPT-4o through structured prompts. These were combined with campaign-level metadata such as fundraising goals, campaign duration, and update frequency. To evaluate the contribution of individual features to prediction performance, we initially trained a random forest classifier using the scikit-learn library (Google Summer of Code project) on the training dataset, with the number of trees set to 100 and the minimum samples required to split an internal node (min_samples_split) set to 2. These parameter values were selected based on a grid search optimization process in which they achieved the highest accuracy (0.72). For feature importance, we used permutation importance, a model-agnostic approach that measures the decline in model performance when each feature is randomly shuffled. This method was applied within the training set to assess the relative contribution of each feature. The features were then ranked by their permutation importance scores. On the basis of these rankings, we constructed a series of feature subsets including the top 3, 6, 9, 12, and 15 features.</p><p>In the second experiment, we applied the same methodology to a different set of features&#x2014;those reflecting social, demographic, and medical information. These included SDOH (eg, references to employment status, caregiving responsibilities, and financial hardship), demographic attributes (eg, inferred race or ethnicity), and medically relevant content (eg, mentions of chemotherapy, hospice care, or immunotherapy). These features were similarly extracted using GPT-4o with custom prompts designed to infer relevant categories from the narrative descriptions in the campaign text. As with the first experiment, random forest with permutation-based feature importance was used to rank features within the training set, and model performance was assessed at various thresholds of top N features.</p><p>For both experiments, we also evaluated the performance of 3 additional ML models: gradient boosting (min_samples_split=2; n_estimators=100), logistic regression, and elastic net (solver=&#x201C;saga&#x201D;; l1_ratio=0.5) with default parameter settings. We evaluated model performance using subsets of the highest-ranked features, testing configurations with 3, 6, 9, 12, and 15 features to provide a comparative perspective. Model performance was assessed using 3 evaluation metrics: accuracy, sensitivity, and specificity. Sensitivity was defined as the ratio of true positives (successful campaigns) to the sum of true positives and false negatives, specificity was defined as the ratio of true negatives (unsuccessful campaigns) to the sum of true negatives and false positives, and accuracy was defined as the proportion of correct predictions out of all predictions made.</p></sec></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Descriptive Analysis</title><p>In our analysis, we used a dataset of crowdfunding campaigns to explore their success in relation to their progress toward the established goal amounts. The descriptive statistics of the raised amounts provided valuable insights into the overall distribution and characteristics of the dataset. Among the 4990 campaigns analyzed, the mean amount raised was US $20,016.67 (SD US $26,456.97), with a median of US $11,819 (IQR US $17,383). Similarly, the mean goal amount among the scraped links was US $40,373.73 (SD US $55,043.88), and the median was US $25,000 (IQR US $38,000). We divided the dataset into 5 distinct groups by categorizing the data into percentile ranges based on the distribution of goal amounts. Each group was of equal size: US $799.99 to US $10,000, US $10,000 to US $20,000, US $20,000 to US $30,000, US $30,000 to US $50,000, and US $50,000 to US $100,000.</p><p><xref ref-type="fig" rid="figure1">Figure 1</xref> illustrates that the donor-to-campaigner ratio increased steadily across goal-amount percentiles, indicating that campaigns with larger targets typically mobilized more donors on average. The alignment between the linear and locally estimated scatterplot smoothing curves suggests that this relationship is approximately linear, though a mild upward curvature at the upper end (80k-100k) may reflect heightened engagement for high-visibility or urgent medical cases. The broader confidence band among large-goal campaigns implies heterogeneity in donor response, consistent with the notion that some high-goal efforts achieve viral reach while others fail to gain traction. Overall, this pattern supports the hypothesis that higher fundraising targets often signaling greater medical severity or broader social networks are associated with enhanced donor participation efficiency.</p><p><xref ref-type="fig" rid="figure2">Figure 2</xref> shows that as the success ratio threshold increases, the proportion of successful campaigns decreases, whereas the number of unsuccessful campaigns increases. This trend is expected as higher thresholds represent more ambitious funding goals, which are harder to achieve.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Donor-to-campaigner efficiency curve for medical crowdfunding campaigns. Linear trend: slope=304.167; intercept=35.000; <italic>R</italic><sup>2</sup>=0.966; <italic>P</italic>=.003. LOESS: locally estimated scatterplot smoothing.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e73448_fig01.png"/></fig><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Distribution of crowdfunding campaigns based on their success ratio.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e73448_fig02.png"/></fig><p><xref ref-type="fig" rid="figure3">Figure 3</xref> shows the ratio of mean campaign span (days) to total campaigns within each success-ratio category: unsuccessful (&#x003C;0.5), moderate (0.5-0.7), successful (0.7-1.0), and highly successful (&#x003E; 1.0). Campaigns achieving higher success ratios exhibited greater relative span durations (approximately 0.41 for highly successful vs approximately 0.05 for unsuccessful campaigns). The upward pattern indicates that prolonged visibility and sustained engagement are associated with improved crowdfunding outcomes, whereas unsuccessful campaigns tend to terminate earlier and attract fewer donors.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Ratio of average span to total campaigns by success ratio.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e73448_fig03.png"/></fig></sec><sec id="s3-2"><title>Socioeconomic Variables and Their Association With Campaign Success</title><p>To assess the role of socioeconomic context in campaign outcomes, we analyzed 5 key variables derived from campaign narratives: work absenteeism, educational activity, friend, struggles with monthly bills, and struggles with food. Work absenteeism captured whether the individual referenced missing work due to illness or treatment, indicating employment disruption and potential income loss. Educational activity included references to school attendance or disruptions to education, suggesting that the campaign involved students or caregivers with educational responsibilities. The friend variable identified campaigns organized by or for a friend, providing insights into the patient&#x2019;s social network and potential campaign reach. Struggles with monthly bills flagged mentions of difficulty affording recurring monthly expenses (eg, rent and utilities), serving as a direct marker of financial strain. Struggling with food indicated food insecurity, reflecting the inability to afford sufficient or nutritious food. Each of these variables was statistically tested for its association with campaign success using chi-square analysis. Although none reached statistical significance at <italic>P</italic>&#x003C;.05, work absenteeism showed a marginal association (<italic>&#x03C7;</italic><sup>2</sup><sub>1</sub>=4.7; <italic>P</italic>=.10), suggesting a potential trend worth further investigation.</p></sec><sec id="s3-3"><title>Campaign Success Determinants</title><p><xref ref-type="fig" rid="figure4">Figure 4</xref> shows the top 13 important features (SDOH) in predicting success at a 0.7 success ratio for the gradient boosting algorithm. Permutation importance score is a metric that indicates how much a particular feature contributes to the predictive power of an ML model. On the basis of the chart, the fact that being in the hospital or in unspecified hospice care was highly important highlights the severe medical conditions often associated with crowdfunding campaigns. Policymakers could use this information to identify areas in which the medical system is failing to cover critical care, prompting discussions on improving hospital funding or hospice services. The importance of income loss suggests that financial hardship due to illness is a key driver of crowdfunding success. This implies that patients need better income protection policies or insurance solutions to support individuals who face financial difficulties due to medical conditions. The involvement of health care organizations as a feature suggests that campaigns supported by these organizations might have better access to resources than campaigns organized by individuals. The importance of chemotherapy treatment as a feature suggests that crowdfunding campaigns associated with this treatment might attract more attention and support, possibly because donors recognize the high costs and seriousness of cancer treatment. In addition, female patients in general tend to have more successful campaigns.</p><p><xref ref-type="fig" rid="figure5">Figure 5</xref> shows the permutation importance scores of various linguistic features related to some aspect of behavior or decision-making, possibly in a medical or social context. The features are ranked by their importance in predicting an outcome, with higher scores indicating a greater influence on the model&#x2019;s performance. The top 4 predictors are risk, clear communication, cognitive style, and family involvement. Empathy and social behaviors are cultivated in professional contexts, and positive messaging should be encouraged across various communication channels. Although less critical, addressing factors such as anger, lifestyle, and reward could further enhance outcomes. These policy recommendations aim to leverage the most influential factors identified by the model to achieve better decision-making and outcomes in the relevant context.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Relative importance of social determinants of health (SDOH) features in predicting crowdfunding campaign success (success ratio threshold=0.7).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e73448_fig04.png"/></fig><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Top linguistic features ranked by permutation importance in predicting campaign success.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="ai_v4i1e73448_fig05.png"/></fig></sec><sec id="s3-4"><title>Performance Evaluation of ML Models</title><p><xref ref-type="table" rid="table2">Table 2</xref> and <xref ref-type="table" rid="table3">Table 3</xref> present the performance evaluation of 4 ML algorithms&#x2014;random forest, gradient boosting, logistic regression, and elastic net&#x2014;at a 0.7 success ratio threshold for SDOH and linguistic factors. The reported performance metrics are accuracy, sensitivity, and specificity across different subsets of top features (ranging from top 3 to top 15). Gradient boosting consistently outperformed the other algorithms in terms of accuracy (consistently 0.786 to 0.788), indicating its superior ability to identify successful crowdfunding campaigns. Random forest offered a balanced performance with good accuracy (0.767 to 0.769) and specificity (0.831 to 0.863), making it a reliable choice for predicting crowdfunding success while capturing nonlinear relationships and interactions. Logistic regression and elastic net exhibited strong specificity (0.997 to 0.999) but poor sensitivity (0.013 to 0.052), which suggests that they may be overly conservative and are not able to predict successful campaigns correctly.</p><p>On the basis of the evaluation, when using gradient boosting, selecting the top 3 to 12 features seems optimal. The top 3 features provide a strong balance of high accuracy and sensitivity with fewer variables, making the model simpler and potentially more generalizable. If one aims to maximize model performance with a bit more complexity, one can consider using up to the top 12 features, which slightly enhances specificity without sacrificing other metrics.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Performance evaluation of machine learning algorithms at a 0.7 success ratio threshold for social determinants of health factors.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Models and metrics</td><td align="left" valign="bottom">Top 3 features</td><td align="left" valign="bottom">Top 6 features</td><td align="left" valign="bottom">Top 9 features</td><td align="left" valign="bottom">Top 12 features</td><td align="left" valign="bottom">Top 15 features</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="7">Random forest</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Accuracy</td><td align="char" char="." valign="top">0.77</td><td align="char" char="." valign="top">0.77</td><td align="char" char="." valign="top">0.76</td><td align="char" char="." valign="top">0.78<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="char" char="." valign="top">0.76</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Sensitivity</td><td align="char" char="." valign="top">0.66</td><td align="char" char="." valign="top">0.66</td><td align="char" char="." valign="top">0.65</td><td align="char" char="." valign="top">0.66</td><td align="char" char="." valign="top">0.61</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Specificity</td><td align="char" char="." valign="top">0.83</td><td align="char" char="." valign="top">0.83</td><td align="char" char="." valign="top">0.83</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.85</td></tr><tr><td align="left" valign="top" colspan="7">Gradient boosting</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Accuracy</td><td align="char" char="." valign="top">0.79</td><td align="char" char="." valign="top">0.78</td><td align="char" char="." valign="top">0.78</td><td align="char" char="." valign="top">0.79<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="char" char="." valign="top">0.79</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Sensitivity</td><td align="char" char="." valign="top">0.69</td><td align="char" char="." valign="top">0.69</td><td align="char" char="." valign="top">0.69</td><td align="char" char="." valign="top">0.69</td><td align="char" char="." valign="top">0.69</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Specificity</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.84</td></tr><tr><td align="left" valign="top" colspan="7">Logistic</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Accuracy</td><td align="char" char="." valign="top">0.64</td><td align="char" char="." valign="top">0.64</td><td align="char" char="." valign="top">0.64</td><td align="char" char="." valign="top">0.64<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="char" char="." valign="top">0.64</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Sensitivity</td><td align="char" char="." valign="top">0.01</td><td align="char" char="." valign="top">0.01</td><td align="char" char="." valign="top">0.01</td><td align="char" char="." valign="top">0.02</td><td align="char" char="." valign="top">0.02</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Specificity</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td></tr><tr><td align="left" valign="top" colspan="7">Elastic net</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Accuracy</td><td align="char" char="." valign="top">0.65</td><td align="char" char="." valign="top">0.65</td><td align="char" char="." valign="top">0.65</td><td align="char" char="." valign="top">0.65<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="char" char="." valign="top">0.65</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Sensitivity</td><td align="char" char="." valign="top">0.04</td><td align="char" char="." valign="top">0.05</td><td align="char" char="." valign="top">0.05</td><td align="char" char="." valign="top">0.05</td><td align="char" char="." valign="top">0.05</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Specificity</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Italics indicate the highest accuracy values across the 4 algorithms. </p></fn></table-wrap-foot></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Performance evaluation of machine learning algorithms at a 0.7 success ratio threshold for linguistic factors.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top" colspan="2">Models and metrics</td><td align="left" valign="top">Top 3 features</td><td align="left" valign="top">Top 6 features</td><td align="left" valign="top">Top 9 features</td><td align="left" valign="top">Top 12 features</td><td align="left" valign="top">Top 15 features</td></tr><tr><td align="left" valign="top" colspan="7">Random forest</td></tr></thead><tbody><tr><td align="left" valign="top"/><td align="left" valign="top">Accuracy</td><td align="char" char="." valign="top">0.77</td><td align="char" char="." valign="top">0.78</td><td align="char" char="." valign="top">0.78</td><td align="char" char="." valign="top">0.79<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="char" char="." valign="top">0.79</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Sensitivity</td><td align="char" char="." valign="top">0.69</td><td align="char" char="." valign="top">0.69</td><td align="char" char="." valign="top">0.69</td><td align="char" char="." valign="top">0.69</td><td align="char" char="." valign="top">0.67</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Specificity</td><td align="char" char="." valign="top">0.81</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.85</td><td align="char" char="." valign="top">0.86</td></tr><tr><td align="left" valign="top" colspan="7">Gradient boosting</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Accuracy</td><td align="char" char="." valign="top">0.80</td><td align="char" char="." valign="top">0.80</td><td align="char" char="." valign="top">0.80</td><td align="char" char="." valign="top">0.80<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="char" char="." valign="top">0.80</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Sensitivity</td><td align="char" char="." valign="top">0.72</td><td align="char" char="." valign="top">0.73</td><td align="char" char="." valign="top">0.72</td><td align="char" char="." valign="top">0.72</td><td align="char" char="." valign="top">0.72</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Specificity</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.84</td><td align="char" char="." valign="top">0.80</td></tr><tr><td align="left" valign="top" colspan="7">Logistic</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Accuracy</td><td align="char" char="." valign="top">0.63</td><td align="char" char="." valign="top">0.63</td><td align="char" char="." valign="top">0.63</td><td align="char" char="." valign="top">0.64<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="char" char="." valign="top">0.64</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Sensitivity</td><td align="char" char="." valign="top">0.02</td><td align="char" char="." valign="top">0.03</td><td align="char" char="." valign="top">0.03</td><td align="char" char="." valign="top">0.06</td><td align="char" char="." valign="top">0.06</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Specificity</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td></tr><tr><td align="left" valign="top" colspan="7">Elastic net</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Accuracy</td><td align="char" char="." valign="top">0.65</td><td align="char" char="." valign="top">0.65</td><td align="char" char="." valign="top">0.65</td><td align="char" char="." valign="top">0.66<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="char" char="." valign="top">0.66</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Sensitivity</td><td align="char" char="." valign="top">0.08</td><td align="char" char="." valign="top">0.08</td><td align="char" char="." valign="top">0.09</td><td align="char" char="." valign="top">0.11</td><td align="char" char="." valign="top">0.11</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Specificity</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">1.00</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>Italics indicate the highest accuracy values across the 4 algorithms.</p></fn></table-wrap-foot></table-wrap><p>The results indicate that careful feature selection is crucial for optimizing model performance for linguistic features. Gradient boosting and random forest showed that selecting approximately the top 12 features provides a strong balance between sensitivity and specificity, making them well suited for predictive tasks in medical crowdfunding. Logistic regression may require a different approach or fewer features to avoid unnecessary complexity, whereas elastic net&#x2019;s performance suggests that a moderate feature increase (up to 18-24 features) could be beneficial. Overall, the findings highlight the importance of tailored feature selection strategies to maximize the effectiveness of ML models in this domain.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this study, we conducted an empirical analysis of medical crowdfunding. The analysis of 4984 crowdfunding campaigns revealed key insights into the relationship among goal amounts, campaign success, and donor engagement. Campaigns with higher goals (US $50,000-$100,000) attracted significantly more donors, indicating that ambitious targets may signal substantial projects, thus drawing greater support. Conversely, lower goal amounts (US $799.99-$10,000) were the most prevalent, suggesting a preference for achievable targets among campaigners. Highly successful campaigns had longer durations, averaging over 250 days. We also focused on deriving features using LLMs and feature selection via the random forest algorithm. We identified donors, goal amount, and span of campaign as critical predictors of success, with emotional and thematic features also contributing to campaign success. Among the ML models evaluated, gradient boosting demonstrated superior performance (range 0.786-0.788) and true positive rate (range 0.693-0.696), outperforming random forest, logistic regression, and elastic net. The analysis highlights the critical role of linguistic and SDOH predictors in the success of crowdfunding campaigns. Linguistic features such as clear and effective communication, particularly regarding risk, along with positive messaging, empathy, and social behaviors, significantly influence campaign outcomes. SDOH predictors, including the severity of medical conditions (eg, hospitalization or unspecified hospice care), income loss, and the involvement of health care organizations, are also key drivers of crowdfunding success. These findings suggest a need for improved hospital funding, better income protection policies, and stronger support from health care organizations. In addition, campaigns associated with high-cost treatments such as chemotherapy tend to attract more attention, underscoring the need for targeted support for patients undergoing such treatments.</p></sec><sec id="s4-2"><title>Limitations</title><p>This study has several limitations. It primarily focused on linguistic, social, demographic, and medical-related features. Other factors, such as donor engagement metrics or campaign visibility on social media platforms, were not evaluated. While cross-validation helps in mitigating overfitting, the generalizability of the model to other types of crowdfunding campaigns beyond the specific dataset used (eg, different medical conditions, geographic regions, or platforms) remains uncertain. The model&#x2019;s performance may vary when applied to other datasets, limiting its broader applicability. This study relied on the available dataset for training and testing. If the dataset is not representative of all cancer crowdfunding campaigns (eg, biased toward certain demographics, treatment types, or socioeconomic groups), the model may not perform well in more diverse or less represented scenarios. Ultimately, the default parameters we chose for random forest feature selection due to a superior performance than that of the grid search method may not be applicable or effective for different datasets.</p></sec><sec id="s4-3"><title>Comparison With Previous Studies</title><p>The findings that communication regarding risk, social behaviors, and empathy play a crucial role in influencing donor behavior have been documented in a previous study [<xref ref-type="bibr" rid="ref32">32</xref>], where it was found that emotionally compelling narratives significantly improve crowdfunding outcomes. Research highlighting the financial burden [<xref ref-type="bibr" rid="ref33">33</xref>] of cancer care provides further support for income loss as a significant predictor. The importance of factors such as being in a hospital or receiving chemotherapy treatment is supported by studies showing that campaigns related to severe or high-cost treatments, such as advanced-stage cancers, often receive more attention and donations [<xref ref-type="bibr" rid="ref34">34</xref>]. Our study also sheds light on new insights on medical crowdfunding. The analysis introduces the importance of specific linguistic features, such as the use of positive language and social behavior indicators, which have not been as thoroughly explored in previous studies. The involvement of health care organizations as a significant predictor suggests that campaigns backed by institutions might have better access to resources and are perceived as more credible.</p></sec><sec id="s4-4"><title>Conclusions</title><p>The reliance on crowdfunding for conditions associated with high-importance features such as hospital stays and income loss highlights potential gaps in health care funding. Policymakers need to assess where these gaps are and consider reforms or additional support mechanisms to reduce the need for crowdfunding in critical areas. The variability in the importance of different features may also point to inequities in access to health care and financial support. Policymakers can better target support to vulnerable populations such as those with comorbidities. A crucial policy objective is ensuring that all individuals, regardless of their medical or financial situation, have equal access to medical care without crowdfunding.</p></sec></sec></body><back><ack><p>The authors thank the Department of Psychiatry and Cancer Center at the College of Medicine, University of Illinois Chicago, for providing computing resources and research support. The authors acknowledge the use of artificial intelligence tool (Microsoft Co-Pilot) for editing the manuscript.</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available in the GitHub repository [<xref ref-type="bibr" rid="ref35">35</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>RB, JG, and EKM conceptualized the study. RB, VS, and AR wrote the code and generated the tables and figures. LB contributed to data collection, coding, and analysis. RB and AR wrote the manuscript.</p></fn><fn fn-type="conflict"><p>EKM is an Editor-in-Chief at JMIR Publications. The other authors declare no conflicts of interest.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">API</term><def><p>application programming interface</p></def></def-item><def-item><term id="abb2">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb3">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb4">SDOH</term><def><p>social determinants of health</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jeffery</surname><given-names>DD</given-names> </name><name name-style="western"><surname>Linton</surname><given-names>A</given-names> </name></person-group><article-title>The impact of depression as a cancer comorbidity: rates, health care utilization, and associated costs</article-title><source>Community Oncol</source><year>2012</year><month>07</month><volume>9</volume><issue>7</issue><fpage>216</fpage><lpage>221</lpage><pub-id pub-id-type="doi">10.1016/j.cmonc.2012.06.002</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pan</surname><given-names>X</given-names> </name><name name-style="western"><surname>Sambamoorthi</surname><given-names>U</given-names> </name></person-group><article-title>Health care expenditures associated with depression in adults with cancer</article-title><source>J Community Support Oncol</source><year>2015</year><month>07</month><volume>13</volume><issue>7</issue><fpage>240</fpage><lpage>247</lpage><pub-id pub-id-type="doi">10.12788/jcso.0150</pub-id><pub-id pub-id-type="medline">26270540</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mausbach</surname><given-names>BT</given-names> </name><name name-style="western"><surname>Irwin</surname><given-names>SA</given-names> </name></person-group><article-title>Depression and healthcare service utilization in patients with cancer</article-title><source>Psychooncology</source><year>2017</year><month>08</month><volume>26</volume><issue>8</issue><fpage>1133</fpage><lpage>1139</lpage><pub-id pub-id-type="doi">10.1002/pon.4133</pub-id><pub-id pub-id-type="medline">27102731</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Beaulieu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Sarker</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sarker</surname><given-names>S</given-names> </name></person-group><article-title>A conceptual framework for understanding crowdfunding</article-title><source>Commun Assoc Inf Syst</source><year>2015</year><volume>37</volume><fpage>87</fpage><pub-id pub-id-type="doi">10.17705/1CAIS.03701</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Belleflamme</surname><given-names>P</given-names> </name><name name-style="western"><surname>Lambert</surname><given-names>T</given-names> </name><name name-style="western"><surname>Schwienbacher</surname><given-names>A</given-names> </name></person-group><article-title>Crowdfunding: tapping the right crowd</article-title><source>J Bus Ventur</source><year>2014</year><month>09</month><volume>29</volume><issue>5</issue><fpage>585</fpage><lpage>609</lpage><pub-id pub-id-type="doi">10.1016/j.jbusvent.2013.07.003</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Koch</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Siering</surname><given-names>M</given-names> </name></person-group><article-title>The recipe of successful crowdfunding campaigns: an analysis of crowdfunding success factors and their interrelations</article-title><source>Electron Mark</source><year>2019</year><volume>29</volume><issue>4</issue><fpage>661</fpage><lpage>679</lpage><pub-id pub-id-type="doi">10.1007/s12525-019-00357-8</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Blanchard</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Noseworthy</surname><given-names>TJ</given-names> </name><name name-style="western"><surname>Pancer</surname><given-names>E</given-names> </name><name name-style="western"><surname>Poole</surname><given-names>M</given-names> </name></person-group><article-title>Extraction of visual information to predict crowdfunding success</article-title><source>Production and Operations Management</source><year>2023</year><month>12</month><volume>32</volume><issue>12</issue><fpage>4172</fpage><lpage>4189</lpage><pub-id pub-id-type="doi">10.1111/poms.14083</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gilligan</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Alberts</surname><given-names>DS</given-names> </name><name name-style="western"><surname>Roe</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Skrepnek</surname><given-names>GH</given-names> </name></person-group><article-title>Death or debt? National estimates of financial toxicity in persons with newly-diagnosed cancer</article-title><source>Am J Med</source><year>2018</year><month>10</month><volume>131</volume><issue>10</issue><fpage>1187</fpage><lpage>1199</lpage><pub-id pub-id-type="doi">10.1016/j.amjmed.2018.05.020</pub-id><pub-id pub-id-type="medline">29906429</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Igra</surname><given-names>M</given-names> </name></person-group><article-title>Donor financial capacity drives racial inequality in medical crowdsourced funding</article-title><source>Soc Forces</source><year>2022</year><month>04</month><day>29</day><volume>100</volume><issue>4</issue><fpage>1856</fpage><lpage>1883</lpage><pub-id pub-id-type="doi">10.1093/sf/soab076</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gleasure</surname><given-names>R</given-names> </name><name name-style="western"><surname>Feller</surname><given-names>J</given-names> </name></person-group><article-title>Does heart or head rule donor behaviors in charitable crowdfunding markets?</article-title><source>Int J Electron Commer</source><year>2016</year><month>10</month><volume>20</volume><issue>4</issue><fpage>499</fpage><lpage>524</lpage><pub-id pub-id-type="doi">10.1080/10864415.2016.1171975</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saleh</surname><given-names>SN</given-names> </name><name name-style="western"><surname>Ajufo</surname><given-names>E</given-names> </name><name name-style="western"><surname>Lehmann</surname><given-names>CU</given-names> </name><name name-style="western"><surname>Medford</surname><given-names>RJ</given-names> </name></person-group><article-title>A comparison of online medical crowdfunding in Canada, the UK, and the US</article-title><source>JAMA Netw Open</source><year>2020</year><month>10</month><day>1</day><volume>3</volume><issue>10</issue><fpage>e2021684</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2020.21684</pub-id><pub-id pub-id-type="medline">33104206</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Snyder</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zenone</surname><given-names>M</given-names> </name><name name-style="western"><surname>Caulfield</surname><given-names>T</given-names> </name></person-group><article-title>Crowdfunding for complementary and alternative medicine: what are cancer patients seeking?</article-title><source>PLoS ONE</source><year>2020</year><volume>15</volume><issue>11</issue><fpage>e0242048</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0242048</pub-id><pub-id pub-id-type="medline">33216790</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Song</surname><given-names>S</given-names> </name><name name-style="western"><surname>Cohen</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Lui</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Use of GoFundMe<sup>&#x00AE;</sup> to crowdfund complementary and alternative medicine treatments for cancer</article-title><source>J Cancer Res Clin Oncol</source><year>2020</year><month>07</month><volume>146</volume><issue>7</issue><fpage>1857</fpage><lpage>1865</lpage><pub-id pub-id-type="doi">10.1007/s00432-020-03191-0</pub-id><pub-id pub-id-type="medline">32219517</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lubl&#x00F3;y</surname><given-names>&#x00C1;</given-names> </name></person-group><article-title>Medical crowdfunding in a healthcare system with universal coverage: an exploratory study</article-title><source>BMC Public Health</source><year>2020</year><month>11</month><day>9</day><volume>20</volume><issue>1</issue><fpage>1672</fpage><pub-id pub-id-type="doi">10.1186/s12889-020-09693-3</pub-id><pub-id pub-id-type="medline">33167927</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ghazal</surname><given-names>LV</given-names> </name><name name-style="western"><surname>Watson</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Gentry</surname><given-names>B</given-names> </name><name name-style="western"><surname>Santacroce</surname><given-names>SJ</given-names> </name></person-group><article-title>&#x201C;Both a life saver and totally shameful&#x201D;: young adult cancer survivors&#x2019; perceptions of medical crowdfunding</article-title><source>J Cancer Surviv</source><year>2023</year><month>04</month><volume>17</volume><issue>2</issue><fpage>332</fpage><lpage>341</lpage><pub-id pub-id-type="doi">10.1007/s11764-022-01188-x</pub-id><pub-id pub-id-type="medline">35169983</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Friedman</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hastie</surname><given-names>T</given-names> </name><name name-style="western"><surname>Tibshirani</surname><given-names>R</given-names> </name></person-group><article-title>Regularization paths for generalized linear models via coordinate descent</article-title><source>J Stat Softw</source><year>2010</year><volume>33</volume><issue>1</issue><fpage>1</fpage><lpage>22</lpage><pub-id pub-id-type="doi">10.1371/journal.pone.0242048</pub-id><pub-id pub-id-type="medline">20808728</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Breiman</surname><given-names>L</given-names> </name></person-group><article-title>Random forests</article-title><source>Mach Learn</source><year>2001</year><month>10</month><volume>45</volume><issue>1</issue><fpage>5</fpage><lpage>32</lpage><pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Greenberg</surname><given-names>MD</given-names> </name><name name-style="western"><surname>Pardo</surname><given-names>B</given-names> </name><name name-style="western"><surname>Hariharan</surname><given-names>K</given-names> </name><name name-style="western"><surname>Gerber</surname><given-names>E</given-names> </name></person-group><article-title>Crowdfunding support tools: predicting success &#x0026; failure</article-title><conf-name>Conference on Extended Abstracts on Human Factors in Computing Systems</conf-name><conf-date>Apr 27 to May 2, 2013</conf-date><pub-id pub-id-type="doi">10.1145/2468356.2468682</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Etter</surname><given-names>V</given-names> </name><name name-style="western"><surname>Grossglauser</surname><given-names>M</given-names> </name><name name-style="western"><surname>Thiran</surname><given-names>P</given-names> </name></person-group><article-title>Launch hard or go home!: predicting the success of kickstarter campaigns</article-title><conf-name>1st ACM Conference on Online Social Networks</conf-name><conf-date>Oct 7-8, 2013</conf-date><pub-id pub-id-type="doi">10.1145/2512938.2512957</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Peng</surname><given-names>L</given-names> </name><name name-style="western"><surname>Cui</surname><given-names>G</given-names> </name><name name-style="western"><surname>Bao</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>S</given-names> </name></person-group><article-title>Speaking the same language: the power of words in crowdfunding success and failure</article-title><source>Mark Lett</source><year>2022</year><month>06</month><volume>33</volume><issue>2</issue><fpage>311</fpage><lpage>323</lpage><pub-id pub-id-type="doi">10.1007/s11002-021-09595-3</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yeh</surname><given-names>JY</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>CH</given-names> </name></person-group><article-title>A machine learning approach to predict the success of crowdfunding fintech project</article-title><source>JEIM</source><year>2022</year><month>11</month><day>24</day><volume>35</volume><issue>6</issue><fpage>1678</fpage><lpage>1696</lpage><pub-id pub-id-type="doi">10.1108/JEIM-01-2019-0017</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ghahramani</surname><given-names>Z</given-names> </name></person-group><article-title>Probabilistic machine learning and artificial intelligence</article-title><source>Nature New Biol</source><year>2015</year><month>05</month><day>28</day><volume>521</volume><issue>7553</issue><fpage>452</fpage><lpage>459</lpage><pub-id pub-id-type="doi">10.1038/nature14541</pub-id><pub-id pub-id-type="medline">26017444</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Mitra</surname><given-names>T</given-names> </name><name name-style="western"><surname>Gilbert</surname><given-names>E</given-names> </name></person-group><article-title>The language that gets people to give: phrases that predict success on kickstarter</article-title><conf-name>17th ACM Conference on Computer Supported Cooperative Work &#x0026; Social Computing</conf-name><conf-date>Feb 15-19, 2014</conf-date><pub-id pub-id-type="doi">10.1145/2531602.2531656</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>YJ</given-names> </name></person-group><article-title>Prediction of fundraising outcomes for crowdfunding projects based on deep learning: a multimodel comparative study</article-title><source>Soft Comput</source><year>2020</year><month>06</month><volume>24</volume><issue>11</issue><fpage>8323</fpage><lpage>8341</lpage><pub-id pub-id-type="doi">10.1007/s00500-020-04822-x</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Jhaveri</surname><given-names>S</given-names> </name><name name-style="western"><surname>Khedkar</surname><given-names>I</given-names> </name><name name-style="western"><surname>Kantharia</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Jaswal</surname><given-names>S</given-names> </name></person-group><article-title>Success prediction using random forest, catboost, xgboost and adaboost for kickstarter campaigns</article-title><conf-name>2019 3rd International Conference on Computing Methodologies and Communication (ICCMC)</conf-name><conf-date>Mar 27-29, 2019</conf-date><pub-id pub-id-type="doi">10.1109/ICCMC.2019.8819828</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Islami</surname><given-names>F</given-names> </name><name name-style="western"><surname>Banegas</surname><given-names>MP</given-names> </name><name name-style="western"><surname>Yabroff</surname><given-names>R</given-names> </name></person-group><article-title>Cancer survivors&#x2019; use of crowdfunding campaigns: AI-generated patterns of reported medical financial hardship and unmet social needs</article-title><source>JCO Oncology Practice</source><year>2023</year><month>11</month><volume>19</volume><issue>11_suppl</issue><fpage>542</fpage><pub-id pub-id-type="doi">10.1200/OP.2023.19.11_suppl.542</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="other"><person-group person-group-type="author"><collab>OpenAI</collab></person-group><article-title>GPT-4 technical report</article-title><source>arXiv</source><access-date>2025-10-22</access-date><comment>Preprint posted online on  Mar 23, 2023</comment><comment><ext-link ext-link-type="uri" xlink:href="https://cdn.openai.com/papers/gpt-4.pdf">https://cdn.openai.com/papers/gpt-4.pdf</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="web"><article-title>GoFundMe terms of service</article-title><source>GoFund Me</source><access-date>2025-11-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.gofundme.com/c/terms">https://www.gofundme.com/c/terms</ext-link></comment></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="web"><article-title>UIC Research</article-title><source>University of Illinois Chicago</source><access-date>2025-11-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://research.uic.edu/uicresearch/">https://research.uic.edu/uicresearch/</ext-link></comment></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Friedman</surname><given-names>JH</given-names> </name></person-group><article-title>Greedy function approximation: a gradient boosting machine</article-title><source>Ann Statist</source><year>2001</year><volume>29</volume><issue>5</issue><pub-id pub-id-type="doi">10.1214/aos/1013203451</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Tao</surname><given-names>X</given-names> </name><name name-style="western"><surname>Ji</surname><given-names>B</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>R</given-names> </name><name name-style="western"><surname>S&#x00F6;rensen</surname><given-names>S</given-names> </name></person-group><article-title>The success of cancer crowdfunding campaigns: project and text analysis</article-title><source>J Med Internet Res</source><year>2023</year><month>03</month><day>3</day><volume>25</volume><fpage>e44197</fpage><pub-id pub-id-type="doi">10.2196/44197</pub-id><pub-id pub-id-type="medline">36692283</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Holler</surname><given-names>JT</given-names> </name><name name-style="western"><surname>Sadighian</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Ghaffar</surname><given-names>U</given-names> </name></person-group><article-title>Online medical crowdfunding in the United States: a cross-sectional analysis of gendered cancer campaign outcomes</article-title><source>J Mens Health</source><year>2023</year><volume>19</volume><issue>3</issue><fpage>29</fpage><lpage>37</lpage><pub-id pub-id-type="doi">10.22514/jomh.2023.022</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Burtch</surname><given-names>G</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>J</given-names> </name></person-group><article-title>Reducing medical bankruptcy through crowdfunding: evidence from giveforward</article-title><access-date>2025-10-22</access-date><conf-name>35th International Conference on Information Systems</conf-name><conf-date>Dec 14-17, 2014</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://aisel.aisnet.org/cgi/viewcontent.cgi?article=1463&#x0026;context=icis2014">https://aisel.aisnet.org/cgi/viewcontent.cgi?article=1463&#x0026;context=icis2014</ext-link></comment></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cohen</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Brody</surname><given-names>H</given-names> </name><name name-style="western"><surname>Patino</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Use of an online crowdfunding platform for unmet financial obligations in cancer care</article-title><source>JAMA Intern Med</source><year>2019</year><month>12</month><day>1</day><volume>179</volume><issue>12</issue><fpage>1717</fpage><lpage>1720</lpage><pub-id pub-id-type="doi">10.1001/jamainternmed.2019.3330</pub-id><pub-id pub-id-type="medline">31498408</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="web"><article-title>Rbhaumik/crowdfunding</article-title><source>GitHub</source><access-date>2025-11-10</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/rbhaumik/crowdfunding">https://github.com/rbhaumik/crowdfunding</ext-link></comment></nlm-citation></ref></ref-list></back></article>