<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR AI</journal-id>
      <journal-title>JMIR AI</journal-title>
      <issn pub-type="epub">2817-1705</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v3i1e51834</article-id>
      <article-id pub-id-type="pmid">38875562</article-id>
      <article-id pub-id-type="doi">10.2196/51834</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Cost, Usability, Credibility, Fairness, Accountability, Transparency, and Explainability Framework for Safe and Effective Large Language Models in Medical Education: Narrative Review and Qualitative Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>El Emam</surname>
            <given-names>Khaled</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Sedaghat</surname>
            <given-names>Sam</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Senst</surname>
            <given-names>Benjamin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Pandey</surname>
            <given-names>Monu</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kulkarni</surname>
            <given-names>Sourabh</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Quttainah</surname>
            <given-names>Majdi</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6280-1060</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Mishra</surname>
            <given-names>Vinaytosh</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>College of Healthcare Management and Economics</institution>
            <institution>Gulf Medical University</institution>
            <addr-line>Al Jurf 1</addr-line>
            <addr-line>Ajman, 4184</addr-line>
            <country>United Arab Emirates</country>
            <phone>971 503310560</phone>
            <email>vinaytosh@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6360-910X</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Madakam</surname>
            <given-names>Somayya</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6708-2061</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Lurie</surname>
            <given-names>Yotam</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0078-2503</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Mark</surname>
            <given-names>Shlomo</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2484-3542</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>College of Business Administration</institution>
        <institution>Kuwait University</institution>
        <addr-line>Kuwait</addr-line>
        <country>Kuwait</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>College of Healthcare Management and Economics</institution>
        <institution>Gulf Medical University</institution>
        <addr-line>Ajman</addr-line>
        <country>United Arab Emirates</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Information Technology</institution>
        <institution>Birla Institute of Management Technology</institution>
        <institution>Knowledge Park - II</institution>
        <addr-line>Greater Noida</addr-line>
        <country>India</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Management</institution>
        <institution>Ben-Gurion University</institution>
        <addr-line>Negev</addr-line>
        <country>Israel</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Software Engineering</institution>
        <institution>Shamoon College of Engineering</institution>
        <addr-line>Ashdod</addr-line>
        <country>Israel</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Vinaytosh Mishra <email>vinaytosh@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>23</day>
        <month>4</month>
        <year>2024</year>
      </pub-date>
      <volume>3</volume>
      <elocation-id>e51834</elocation-id>
      <history>
        <date date-type="received">
          <day>16</day>
          <month>8</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>11</day>
          <month>12</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>20</day>
          <month>12</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>3</day>
          <month>2</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Majdi Quttainah, Vinaytosh Mishra, Somayya Madakam, Yotam Lurie, Shlomo Mark. Originally published in JMIR AI (https://ai.jmir.org), 23.04.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR AI, is properly cited. The complete bibliographic information, a link to the original publication on https://www.ai.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://ai.jmir.org/2024/1/e51834" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The world has witnessed increased adoption of large language models (LLMs) in the last year. Although the products developed using LLMs have the potential to solve accessibility and efficiency problems in health care, there is a lack of available guidelines for developing LLMs for health care, especially for medical education.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to identify and prioritize the enablers for developing successful LLMs for medical education. We further evaluated the relationships among these identified enablers.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>A narrative review of the extant literature was first performed to identify the key enablers for LLM development. We additionally gathered the opinions of LLM users to determine the relative importance of these enablers using an analytical hierarchy process (AHP), which is a multicriteria decision-making method. Further, total interpretive structural modeling (TISM) was used to analyze the perspectives of product developers and ascertain the relationships and hierarchy among these enablers. Finally, the cross-impact matrix-based multiplication applied to a classification (MICMAC) approach was used to determine the relative driving and dependence powers of these enablers. A nonprobabilistic purposive sampling approach was used for recruitment of focus groups.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The AHP demonstrated that the most important enabler for LLMs was <italic>credibility</italic>, with a priority weight of 0.37, followed by <italic>accountability</italic> (0.27642) and <italic>fairness</italic> (0.10572). In contrast, <italic>usability</italic>, with a priority weight of 0.04, showed negligible importance. The results of TISM concurred with the findings of the AHP. The only striking difference between expert perspectives and user preference evaluation was that the product developers indicated that <italic>cost</italic> has the least importance as a potential enabler. The MICMAC analysis suggested that cost has a strong influence on other enablers. The inputs of the focus group were found to be reliable, with a consistency ratio less than 0.1 (0.084).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study is the first to identify, prioritize, and analyze the relationships of enablers of effective LLMs for medical education. Based on the results of this study, we developed a comprehendible prescriptive framework, named CUC-FATE (Cost, Usability, Credibility, Fairness, Accountability, Transparency, and Explainability), for evaluating the enablers of LLMs in medical education. The study findings are useful for health care professionals, health technology experts, medical technology regulators, and policy makers.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>large language model</kwd>
        <kwd>LLM</kwd>
        <kwd>ChatGPT</kwd>
        <kwd>CUC-FATE framework</kwd>
        <kwd>cost, usability, credibility, fairness, accountability, transparency, and explainability</kwd>
        <kwd>analytical hierarchy process</kwd>
        <kwd>AHP</kwd>
        <kwd>total interpretive structural modeling</kwd>
        <kwd>TISM</kwd>
        <kwd>medical education</kwd>
        <kwd>adoption</kwd>
        <kwd>guideline</kwd>
        <kwd>development</kwd>
        <kwd>health care</kwd>
        <kwd>chat generative pretrained transformer</kwd>
        <kwd>generative language model tool</kwd>
        <kwd>user</kwd>
        <kwd>innovation</kwd>
        <kwd>data generation</kwd>
        <kwd>narrative review</kwd>
        <kwd>health care professional</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Natural language processing solutions have been available for the last 15 years. However, these models recently witnessed a major breakthrough with the launch of ChatGPT by OpenAI, a company that was only established recently (December 2015) after receiving an investment from Elon Musk and others. ChatGPT is a generative language model tool that enables users to converse with machines about various subjects. With 1.6 billion monthly users, this freemium service is the fastest-growing application in the history of the internet. Since its release on November 30, 2022, ChatGPT has sparked much discussion and enthusiasm in multiple industries, including medicine. ChatGPT and related technologies have been identified as disruptive innovations with the potential to revolutionize academia and scholarly publishing [<xref ref-type="bibr" rid="ref1">1</xref>]. Additionally, preliminary research suggests that ChatGPT has practical applications throughout the clinical workflow [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
        <p>The introduction of ChatGPT and the subsequent release of several extended products and functional plugins have profoundly impacted scientific researchers. These products have also influenced the ideas and methodologies used in traditional research, including recommendation, emotion recognition, and information generation. ChatGPT’s assistance has improved some of the associated work in these fields, particularly with providing helpful supplementary information to raise the caliber of data generation. With the integration of machine learning and artificial intelligence (AI) technologies, medical imaging has advanced quickly. Among these developments, using cutting-edge language models such as large language models (LLMs), ChatGPT, and GPT-4 has shown significant promise in elevating several elements of medical imaging and revolutionizing radiology. These models can produce and comprehend human-like text owing to access to various textbooks, journals, and research materials available on the internet. This could provide the necessary context and prior knowledge to support a variety of tasks involving medical imaging, such as synthesis, reconstruction, analysis, segmentation, interpretation, automated reporting, and more. These technologies have further been improved using supervised and reinforcement learning methods based on OpenAI’s GPT LLMs. These models have shown excellent performance in various natural language processing (NLP) tasks, including language translation, text summarization, and question-answering. The models have been pretrained on enormous amounts of text data. Users can ask questions, obtain responses, and engage in genuine conversation with the bot given ChatGPT’s human-like conversational experience.</p>
        <p>ChatGPT and other LLMs remain a research hotspot in multimedia analysis and application. However, several crucial difficulties must be resolved, including (1) improving interactions with ChatGPT to collect more useful auxiliary information, (2) methods to combine ChatGPT with traditional inquiries to fully exploit its benefits, and (3) analyzing the data obtained from ChatGPT for their incorporation with the intended usage. A particularly significant challenge is to effectively use past information obtained with such huge models and to ensure consistency and complementary features across many modalities to improve multimodal generation performance, which is especially relevant for AI-generated content. The finest use cases for ChatGPT, a well-liked chatbot built on a potent AI language model, are still being worked out. ChatGPT can provide help in writing an essay, thesis, or dissertation by creating a research question, developing a plan, developing literary concepts, rewriting text, and getting feedback. Moreover, the NLP and automated data analysis capabilities offered by ChatGPT enable researchers, marketers, and organizations to analyze text quickly and accurately. Via its AI-powered functions, ChatGPT can help to spot significant trends and insights in a data set that might otherwise be challenging to find. Additionally, ChatGPT can assist with the creation of top-notch prompts for paper analysis.</p>
      </sec>
      <sec>
        <title>LLM Functionality</title>
        <p>ChatGPT is a prediction system that anticipates what it should write based on previously processed texts. This type of AI is known as a language model. However, ChatGPT offers more promise than its predecessors given that it is trained on enormous amounts of data, with the majority of these data originating from the abundant supply of data available on the internet. According to OpenAI, ChatGPT was also trained on examples of back-and-forth human interaction, which results in a conversation style that is much more human than that of other chatbots, thus advancing the capability of NLP solutions.</p>
        <p>NLP is a field of AI employing linguistics, statistics, and machine learning to enable computers to comprehend spoken language. NLP systems can infer meaning from spoken or written words, including all of the subtleties and complexities of an accurate narrative text. This makes it possible for machines to obtain value from even unstructured data. NLP has witnessed significant advancements in recent years. An LLM is a deep-learning algorithm that can be used to perform NLP tasks, including, among other abilities, summarizing and generating text. As one of the main applications, LLM-based chatbots are computer programs that can simulate conversations with human users. NLP techniques can be used to enable chatbots to understand and respond to user input. An LLM uses deep-learning techniques to understand and generate human language; it is trained on vast amounts of text data and then uses statistical algorithms to learn patterns and relationships within language. These models can perform various tasks, including language translation, question-answering, sentiment analysis, and summarization. With ChatGPT, users can learn, compare, and validate answers for different academic subjects, including physics, math, and chemistry, as well as abstract topics such as philosophy and religion [<xref ref-type="bibr" rid="ref3">3</xref>]. Users can also generate human-like text such as news articles, chatbot conversations, and even literary works such as essays and romantic poems. The main difference of GPTs from other LLMs lies in their architecture and training methodology. GPTs are based on a deep-learning architecture known as a “transformer.” Transformers are designed to process sequential data such as language more efficiently than other architectures. LLMs are currently at the forefront of intertwining AI systems with human communication and everyday life [<xref ref-type="bibr" rid="ref4">4</xref>].
Large pretrained language models have significantly advanced NLP research with respect to various applications [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Although these more complicated language models can produce complex and coherent natural language, several recent studies have shown that they can also pick up unfavorable social biases that can feed into negative stereotypes [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      </sec>
      <sec>
        <title>NLP in Health Care</title>
        <p>Health care consumers may turn to the research literature for information not provided in patient-friendly documents. However, reading medical literature can be difficult. One study identified four key elements made possible by NLP to increase access to medical papers: explanations of foreign terminology, plain language section summaries, a list of crucial questions that direct readers to the portions that provide the answers, and simple language summaries of those passages [<xref ref-type="bibr" rid="ref8">8</xref>]. Significant advancements in smart health care have been made in recent years, with new AI technologies enabling a range of intelligent applications in various health care contexts. NLP, as a fundamental AI-powered technology that can analyze and comprehend human language, is crucial for smart health care [<xref ref-type="bibr" rid="ref9">9</xref>]. NLP methods have been utilized to organize data in health care systems by sifting out pertinent information from narrative texts to offer information for decision-making. Thus, NLP approaches help to lower health care costs and are essential for streamlining health care procedures [<xref ref-type="bibr" rid="ref10">10</xref>]. Advancements in NLP will make robotic process automation possible in health care, which can further drive efficiency. Health care data are complex, which should be given due consideration at the time of designing health care applications. Deep-learning approaches such as convolutional neural network and recurrent neural network models have become prominent in health care applications, demonstrating promising accuracy. Nevertheless, there is still substantial room for improvement of these models to enable their usage without human supervision. 
Deep-learning techniques offer an effective and efficient model for data analysis by revealing hidden patterns and extracting valuable information from a large volume of health data, which standard analytics cannot perform within a given time frame [<xref ref-type="bibr" rid="ref11">11</xref>].</p>
      </sec>
      <sec>
        <title>ChatGPT in Medical Education</title>
        <p>ChatGPT has many potential applications in health care education, research, and practice [<xref ref-type="bibr" rid="ref12">12</xref>], which can enhance medical education by helping students develop subjective learning and expression skills [<xref ref-type="bibr" rid="ref13">13</xref>]. The number of ChatGPT users has shown exponential growth and the tool is increasingly utilized by students, residents, and attending physicians to direct learning and answer clinical questions [<xref ref-type="bibr" rid="ref14">14</xref>]. However, authors using ChatGPT professionally for academic work should exercise caution as it remains unclear how ChatGPT handles hazardous content, false information, or plagiarism [<xref ref-type="bibr" rid="ref15">15</xref>]. While ChatGPT can simplify the task of radiological reporting, there is still a chance of inaccurate statements and missing medical information [<xref ref-type="bibr" rid="ref15">15</xref>]. Therefore, the tool needs refinement before it can be used widely with confidence in medicine [<xref ref-type="bibr" rid="ref16">16</xref>]. A recent review explored ChatGPT’s applications and reported various challenges such as ethical concerns, data biases, and safety issues [<xref ref-type="bibr" rid="ref17">17</xref>]. Thus, it is imperative to balance AI-assisted innovation and human expertise [<xref ref-type="bibr" rid="ref18">18</xref>]. ChatGPT has quickly gained significant attention from academia, research, and industries despite these shortcomings. The first aim of this study was therefore to determine the requirements, or enablers, for a successful LLM application in medical education using a narrative review of the existing literature.</p>
      </sec>
      <sec>
        <title>Enablers of LLM for Medical Education</title>
        <p>For the purpose of this study, we refer to enablers as the factors, resources, or conditions that facilitate or support achieving a good LLM application for medical education. Medical education prepares would-be physicians and other health care professionals with the knowledge, skills, and attitudes necessary for competent and compassionate patient care. The general definition of an enabler is a factor that makes it easier for a goal to be realized or for someone to accomplish a particular task. Enablers of LLM for medical education can be tangible or intangible and should play a crucial role in achieving the outcomes expected from the application.</p>
        <p>As LLMs are trained on massive data, they are resource-demanding tools. Therefore, the cost of training an LLM for medical education may be prohibitive [<xref ref-type="bibr" rid="ref19">19</xref>]. Accordingly, it is imperative to use efficient computing to address this issue [<xref ref-type="bibr" rid="ref20">20</xref>]. Usability is one of the key criteria that determines the usefulness of an application in medical education, and LLMs are no exception [<xref ref-type="bibr" rid="ref21">21</xref>]. The extant literature has highlighted usability as an important criterion for the successful implementation of a new technology in education [<xref ref-type="bibr" rid="ref22">22</xref>]. Similarly, the credibility of an application is another very important factor for technological interventions used in medical education [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Although ChatGPT has disclaimers about the source of information provided, it does not disclose its sources categorically, and can sometimes hallucinate about the source, which may be misleading to the user. LLMs also have reported issues with fairness, computation, and privacy. By perpetuating social prejudices and stereotypes, they risk causing unfair discrimination and physical harm, along with potential harm to the user’s reputation [<xref ref-type="bibr" rid="ref25">25</xref>]. Ma et al [<xref ref-type="bibr" rid="ref26">26</xref>] provided an overview of fairness of LLMs in multilingual and non-English situations, emphasizing the limitations of recent studies and the challenges faced by English-only methodologies.</p>
        <p>Another issue of LLMs such as ChatGPT is related to their accountability, generally defined as taking responsibility for one’s obligation to treat others honestly and morally. However, it is unclear who will be held accountable and responsible if the LLM provides incorrect recommendations or forecasts for a particular downstream activity. Overall, employing LLMs is associated with considerable risk; therefore, precautions must be taken to minimize these risks and ensure their ethical and responsible use. To foster a cross-disciplinary global inclusive consensus on the ethical use, disclosure, and proper reporting of generative AI models such as GPT and other LLM technologies in academia, Cacciamani et al [<xref ref-type="bibr" rid="ref23">23</xref>] proposed the ChatGPT, Generative Artificial Intelligence, and Natural Large Language Models for Accountable Reporting and Use Guidelines initiative in 2023. However, the underlying model of GPT-3.5 deviates from the ethical guidelines proposed by Cacciamani et al [<xref ref-type="bibr" rid="ref23">23</xref>]. Another important criterion reported for the medical applications of LLMs is transparency, which is an essential ethical consideration in the fields of science, engineering, business, and the humanities. Transparency refers to functioning in a way that makes it simple for others to observe what actions have been taken [<xref ref-type="bibr" rid="ref27">27</xref>], thus representing a sign of responsibility, honesty, and openness. Conversely, LLMs are opaque to users. Recently suggested explainability techniques aim to make LLMs more transparent. Although these techniques are not a cure-all, they might form the basis for the development of models with fewer flaws or, at the very least, the ability to explain their logic.
In their systematic experiments with synthetic data, Wu et al [<xref ref-type="bibr" rid="ref28">28</xref>] demonstrated that autoregressive and masked language models can successfully learn to emulate semantic relations between expressions with strong transparency, where all expressions have context-independent denotations.</p>
        <p>Finally, the LLMs used in medical education must be explainable, and the best freely available options lag in this respect. Most LLMs are complex models built using deep learning [<xref ref-type="bibr" rid="ref29">29</xref>]; therefore, these models can produce better predictions with more information or network parameters, which comes at the cost of explainability. Some models fail to describe how they came to their conclusion. Recently suggested explainability techniques aim to make language models more transparent. Even though these are not complete solutions, they can act as the basis for the development of less problematic models or, at the very least, models that can explain their logic. However, Du et al [<xref ref-type="bibr" rid="ref30">30</xref>] identified false patterns detected by LLMs using explainability in their study.</p>
      </sec>
      <sec>
        <title>Need for This Study</title>
        <p>The need for this study arises from the rapid integration of LLMs such as ChatGPT in various fields, including medical education. Although LLMs offer promising benefits for health care, their effective integration in medical education remains a developing area. Accordingly, the aim of this study was to identify and prioritize the key enablers for successful LLM implementation in medical education. This can in turn help to address the lack of comprehensive frameworks guiding the development and use of LLMs in this field. By exploring the dynamics of various enablers such as credibility, accountability, fairness, cost, usability, transparency, and explainability, this study provides a structured approach to enhance the quality and effectiveness of LLMs in educating health care professionals.</p>
        <p>Specifically, this study was based on the following three major research questions: (1) What are the enablers of a suitable LLM application for medical education? (2) What is the relative importance of these enablers in achieving the goals of medical education? and (3) What is an approach to developing an LLM to achieve medical education goals? With this background, the following research objectives were set: (1) identify the enablers of a suitable LLM for medical education, (2) prioritize the identified enablers in achieving the goals of medical education, and (3) propose a framework for developing an LLM to achieve the medical education goals.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>To achieve the first research objective, we performed a narrative review of the extant literature published on technology solutions in medical education. A narrative review is a scholarly article synthesizing existing research on a particular topic in a narrative or story-like manner. Unlike systematic reviews or meta-analyses, which use rigorous methodologies to analyze and summarize research findings quantitatively, narrative reviews provide a qualitative, comprehensive overview of a subject. Narrative reviews often involve critical analysis and discussion, integrating the authors’ expertise and interpretation. Narrative reviews are thus useful for obtaining a broad understanding of a topic and identifying trends, gaps, and controversies within a field.</p>
        <p>Two authors (SM and VM) searched the Scopus, Web of Science, and Google Scholar databases to identify suitable literature for our narrative review. The inclusion criteria were articles published in the English language in the last 5 years. In the second stage, duplicates and articles for which the full text was unavailable were eliminated. The identified enablers from this review were then used to address the first research question. These enablers were presented to a focus group comprising seven experts working in universities and institutions delivering medical education in India and the United Arab Emirates to validate the selection (<xref ref-type="table" rid="table1">Table 1</xref>). The focus group endorsed the choice of the enablers for further research; in addition, one article published in 2010 was added on the recommendation of the focus group as it was found to be useful in explaining competing interests in medical education. One author (VM) facilitated the focus group discussion to obtain the finalized list of enablers.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Characteristics of the focus group for validation of identified enablers.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="240"/>
            <col width="140"/>
            <col width="130"/>
            <col width="240"/>
            <thead>
              <tr valign="top">
                <td>Expert</td>
                <td>Qualification</td>
                <td>Experience (years)</td>
                <td>Age (years)</td>
                <td>Nationality</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Cardiologist</td>
                <td>Masters in Medicine</td>
                <td>12</td>
                <td>42</td>
                <td>India</td>
              </tr>
              <tr valign="top">
                <td>Endocrinologist</td>
                <td>Masters in Medicine</td>
                <td>20</td>
                <td>45</td>
                <td>India</td>
              </tr>
              <tr valign="top">
                <td>Technology expert</td>
                <td>Doctor of Philosophy</td>
                <td>15</td>
                <td>50</td>
                <td>United Arab Emirates</td>
              </tr>
              <tr valign="top">
                <td>Dentistry educator</td>
                <td>Masters in Dentistry</td>
                <td>10</td>
                <td>40</td>
                <td>United Arab Emirates</td>
              </tr>
              <tr valign="top">
                <td>Podiatrist educator</td>
                <td>Doctor of Philosophy</td>
                <td>10</td>
                <td>35</td>
                <td>United Arab Emirates</td>
              </tr>
              <tr valign="top">
                <td>Diabetes educator</td>
                <td>Doctor of Philosophy</td>
                <td>18</td>
                <td>43</td>
                <td>India</td>
              </tr>
              <tr valign="top">
                <td>Nursing educator</td>
                <td>Doctor of Philosophy</td>
                <td>15</td>
                <td>41</td>
                <td>United Arab Emirates</td>
              </tr>
              <tr valign="top">
                <td>Radiologist</td>
                <td>Doctor of Philosophy</td>
                <td>12</td>
                <td>41</td>
                <td>India</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Analytical Hierarchy Process Modeling</title>
        <p>An analytical hierarchy process (AHP) was utilized to achieve the second study objective of prioritizing the identified enablers for developing an LLM for medical education. The AHP is a popular method for determining the relative importance of the criteria in a multicriteria decision analysis task. To date, the AHP has been extensively used in the management and social science fields [<xref ref-type="bibr" rid="ref31">31</xref>]. The advantage of this process is that it incorporates mechanisms to assure the reliability of decision-making in cases of ambiguity. Some researchers have suggested using a “fuzzy” version of the AHP [<xref ref-type="bibr" rid="ref32">32</xref>] and others have suggested using the entropy weight method to reduce the negative effect of individual subjective evaluation bias on the accuracy of comprehensive evaluation [<xref ref-type="bibr" rid="ref33">33</xref>]. Since the ranking obtained by the AHP method was further validated by total interpretive structural modeling (TISM) in this study (see below), fuzzy logic or entropy weight was avoided in our AHP modeling. The five steps used for AHP are: (1) defining the decision problem, (2) creating a hierarchy, (3) pairwise comparison, (4) deriving a weighted priority, and (5) consistency check for decision. We used the Delphi method for pairwise comparisons. A cut-off value of 75% was used to accept the value for the pairwise comparison. The standard scale proposed by Saaty [<xref ref-type="bibr" rid="ref34">34</xref>] was used for the pairwise comparison.</p>
      </sec>
      <sec>
        <title>TISM and Focus Groups</title>
        <p>Finally, to address the third research objective, we investigated the relationships among key enablers to inform the development of a suitable medical education LLM. A qualitative research design is useful to understand a phenomenon under study rather than assessing the strength and direction of causal relationships in a conceptual model [<xref ref-type="bibr" rid="ref35">35</xref>]. For this purpose, we established a focus group with five experts in the fields of information technology and product development with relevant research experience. The details of this expert group are provided in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <p>According to the information obtained from the focus group, TISM was used to model the enablers for a medical education LLM application. In his seminal paper, Sushil [<xref ref-type="bibr" rid="ref36">36</xref>] provides a detailed account of the interpretation of interpretive structural modeling and TISM, highlighting the advantage of the latter over the former. For the sake of brevity, we have not included the details of the TISM method herein, which can be found in the relevant literature [<xref ref-type="bibr" rid="ref37">37</xref>]. In brief, TISM is a process that converts poorly articulated mental models of systems into visible and well-defined models that are useful for gaining better understanding and decision-making. The presence and absence of a relationship between enablers were ascertained based on an unstructured interview of the focus group conducted by one researcher (SM). If more than 50% of the focus group members indicated that there is a relationship between two enablers, the relationship was considered to be present, which was coded as “Y.” An overview of the TISM approach used in this study is provided in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Characteristics of the focus group used for total interpretive structural modeling.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="240"/>
            <col width="260"/>
            <col width="140"/>
            <col width="130"/>
            <col width="230"/>
            <thead>
              <tr valign="top">
                <td>Expert</td>
                <td>Qualification</td>
                <td>Experience (years)</td>
                <td>Age (years)</td>
                <td>Country</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Product development</td>
                <td>Masters in management</td>
                <td>21</td>
                <td>42</td>
                <td>Singapore</td>
              </tr>
              <tr valign="top">
                <td>Product development</td>
                <td>Bachelors in engineering</td>
                <td>21</td>
                <td>42</td>
                <td>United Arab Emirates</td>
              </tr>
              <tr valign="top">
                <td>Technology expert</td>
                <td>Bachelors in engineering</td>
                <td>19</td>
                <td>40</td>
                <td>India</td>
              </tr>
              <tr valign="top">
                <td>Technology expert</td>
                <td>Masters in engineering</td>
                <td>10</td>
                <td>33</td>
                <td>India</td>
              </tr>
              <tr valign="top">
                <td>Decision science expert</td>
                <td>Doctor of Philosophy</td>
                <td>10</td>
                <td>38</td>
                <td>India</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Summary of the total interpretive structural modeling (TISM) approach used in the study. Adapted from Mishra and Rana [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
          </caption>
          <graphic xlink:href="ai_v3i1e51834_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>We further used cross-impact matrix multiplication applied to classification (MICMAC) analysis to evaluate the direct and indirect relationships among various elements in a complex system. MICMAC analysis is applied to the reachability matrix to classify the elements into four categories based on their driving power (ability to influence other elements) and dependence (level of being influenced by other elements).</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study, involving a qualitative focus group discussion, did not require approval from an ethical review board as it did not involve human subjects in a manner necessitating such review. No informed consent was required for the same reason. However, to maintain ethical standards, we ensured that all data collected were either anonymized or deidentified. This means that any information that could potentially identify individual participants was removed or altered to protect their privacy. No compensation was provided to participants, as is common in studies of this nature. This decision was made considering the study design and the ethical imperative to avoid undue influence on participants’ responses. The absence of compensation was communicated to all participants. Throughout the study, we adhered to strict data protection protocols to safeguard the confidentiality of the information shared during the focus group discussions. These measures included secure data storage, restricted access to authorized personnel, and adherence to data protection laws and regulations. This approach ensured that the privacy and integrity of participant information were always maintained.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>AHP Modeling</title>
        <p>Based on the selected enablers identified for developing a suitable LLM medical education application according to the narrative review of the literature (<xref ref-type="table" rid="table3">Table 3</xref>), the focus group was asked to provide their input for pairwise comparison, and the resultant matrix [A] is presented in <xref ref-type="table" rid="table4">Table 4</xref>.</p>
        <p>Once the initial comparison matrix was determined, the matrix was normalized and an average of each row was taken to calculate the priority weight [X]. The normalized matrix, priority weight, and rank of the enablers are given in <xref ref-type="table" rid="table5">Table 5</xref>. The priority weight, as the eigenvector, was further used to calculate the consistency ratio (CR).</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Summary of reported enablers of large language models for medical education.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="140"/>
            <col width="140"/>
            <col width="600"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td>Enabler code</td>
                <td>Enabler</td>
                <td>Description</td>
                <td>References</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>E1</td>
                <td>Cost</td>
                <td>Cost of computation, including hardware, software, and energy requirement</td>
                <td>[<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]</td>
              </tr>
              <tr valign="top">
                <td>E2</td>
                <td>Usability</td>
                <td>User-centric design, ease of use, and positive user experiences</td>
                <td>[<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]</td>
              </tr>
              <tr valign="top">
                <td>E3</td>
                <td>Credibility</td>
                <td>Level of trust and reliability that users place in the application</td>
                <td>[<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]</td>
              </tr>
              <tr valign="top">
                <td>E4</td>
                <td>Fairness</td>
                <td>Absence of unfair discrimination, physical harm, and harm to user reputation</td>
                <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]</td>
              </tr>
              <tr valign="top">
                <td>E5</td>
                <td>Accountability</td>
                <td>Taking responsibility for the obligation to treat users with honesty and morality</td>
                <td>[<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]</td>
              </tr>
              <tr valign="top">
                <td>E6</td>
                <td>Transparency</td>
                <td>Functioning in a way that makes it simple for others to observe what actions are taken</td>
                <td>[<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]</td>
              </tr>
              <tr valign="top">
                <td>E7</td>
                <td>Explainability</td>
                <td>Ability to describe how the models came to their conclusion</td>
                <td>[<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Initial pairwise comparison matrix for the analytical hierarchy process.<sup>a</sup></p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="80"/>
            <col width="110"/>
            <col width="120"/>
            <col width="110"/>
            <col width="170"/>
            <col width="150"/>
            <col width="160"/>
            <thead>
              <tr valign="top">
                <td>Enablers</td>
                <td>Cost (E1)</td>
                <td>Usability (E2)</td>
                <td>Credibility (E3)</td>
                <td>Fairness (E4)</td>
                <td>Accountability (E5)</td>
                <td>Transparency (E6)</td>
                <td>Explainability (E7)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>E1</td>
                <td>1</td>
                <td>3</td>
                <td>0.2</td>
                <td>1</td>
                <td>0.2</td>
                <td>3</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>E2</td>
                <td>0.33</td>
                <td>1</td>
                <td>0.11</td>
                <td>0.33</td>
                <td>0.11</td>
                <td>1</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>E3</td>
                <td>5</td>
                <td>9</td>
                <td>1</td>
                <td>5</td>
                <td>5</td>
                <td>3</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>E4</td>
                <td>1</td>
                <td>3</td>
                <td>0.2</td>
                <td>1</td>
                <td>0.2</td>
                <td>3</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>E5</td>
                <td>5</td>
                <td>9</td>
                <td>0.2</td>
                <td>5</td>
                <td>1</td>
                <td>5</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>E6</td>
                <td>0.33</td>
                <td>1</td>
                <td>0.33</td>
                <td>0.33</td>
                <td>0.2</td>
                <td>1</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>E7</td>
                <td>0.33</td>
                <td>1</td>
                <td>0.33</td>
                <td>0.33</td>
                <td>0.2</td>
                <td>0.2</td>
                <td>1</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>Numbers represent the pairwise comparison of different enablers using the scale developed by Saaty [<xref ref-type="bibr" rid="ref34">34</xref>].</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Normalized matrix and priority weight of enablers.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="80"/>
            <col width="90"/>
            <col width="90"/>
            <col width="120"/>
            <col width="90"/>
            <col width="140"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="60"/>
            <thead>
              <tr valign="top">
                <td>Enablers</td>
                <td>Cost (E1)</td>
                <td>Usability (E2)</td>
                <td>Credibility (E3)</td>
                <td>Fairness (E4)</td>
                <td>Accountability (E5)</td>
                <td>Transparency (E6)</td>
                <td>Explainability (E7)</td>
                <td>Priority weight</td>
                <td>Rank</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>E1</td>
                <td>0.077</td>
                <td>0.1111</td>
                <td>0.0844</td>
                <td>0.077</td>
                <td>0.0289</td>
                <td>0.1852</td>
                <td>0.1765</td>
                <td>0.10572</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>E2</td>
                <td>0.0254</td>
                <td>0.037</td>
                <td>0.0464</td>
                <td>0.026</td>
                <td>0.0159</td>
                <td>0.0617</td>
                <td>0.0588</td>
                <td>0.03871</td>
                <td>7</td>
              </tr>
              <tr valign="top">
                <td>E3</td>
                <td>0.3849</td>
                <td>0.3333</td>
                <td>0.4219</td>
                <td>0.385</td>
                <td>0.7236</td>
                <td>0.1852</td>
                <td>0.1765</td>
                <td>0.37289</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td>E4</td>
                <td>0.077</td>
                <td>0.1111</td>
                <td>0.0844</td>
                <td>0.077</td>
                <td>0.0289</td>
                <td>0.1852</td>
                <td>0.1765</td>
                <td>0.10572</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>E5</td>
                <td>0.3849</td>
                <td>0.3333</td>
                <td>0.0844</td>
                <td>0.385</td>
                <td>0.1447</td>
                <td>0.3086</td>
                <td>0.2941</td>
                <td>0.27642</td>
                <td>2</td>
              </tr>
              <tr valign="top">
                <td>E6</td>
                <td>0.0254</td>
                <td>0.037</td>
                <td>0.1392</td>
                <td>0.025</td>
                <td>0.0289</td>
                <td>0.0617</td>
                <td>0.0588</td>
                <td>0.0538</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td>E7</td>
                <td>0.0254</td>
                <td>0.037</td>
                <td>0.1392</td>
                <td>0.025</td>
                <td>0.0289</td>
                <td>0.0123</td>
                <td>0.0588</td>
                <td>0.04674</td>
                <td>6</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>Based on this matrix, the eigenvector X was calculated according to the following equation:</p>
        <disp-formula>
        [A] X = <italic>λ<sub>max</sub></italic> X – (1)
        </disp-formula>
        <p>Using the data in <xref ref-type="table" rid="table4">Tables 4</xref> and <xref ref-type="table" rid="table5">5</xref>, <italic>λ<sub>max</sub></italic> was obtained as follows:</p>
        <disp-formula>
        [A]X = [0.76, 0.28, 3.46, 0.76, 2.26, 0.39, 0.34] – (2)
           </disp-formula>
        <disp-formula><italic>λ<sub>max</sub></italic> = average {0.76/0.11, 0.28/0.04, 3.46/0.37, 0.76/0.11, 2.26/0.28, 0.39/0.05, 0.34/0.05} – (3)
        </disp-formula>
        <disp-formula><italic>λ<sub>max</sub></italic> = 7.66 – (4)
        </disp-formula>
        <p>The consistency index (CI) was then calculated based on the <italic>λ<sub>max</sub></italic> as follows: CI = (7.66 – 7)/6 = 0.11 – (5). Finally, the CR of the judgment was calculated by dividing the CI by the random index (RI). The RI value for a 7×7 matrix is 1.32 from the RI table. Thus, the CR becomes 0.084; as this is less than 0.1, it is considered to be acceptable.</p>
      </sec>
      <sec>
        <title>Modeling Relationships Among Enablers</title>
        <p>We further used TISM for ascertaining the relationships among these seven enablers. <xref ref-type="table" rid="table6">Table 6</xref> shows a matrix indicating the interrelationships between the enablers listed in <xref ref-type="table" rid="table3">Table 3</xref>, with “Y” indicating the existence of a relationship and “N” indicating no relationship. The resultant matrix is referred to as the structural self-interaction matrix.</p>
        <p>In the next step, we replaced all “Ys” with 1s and all “Ns” with 0s and incorporated the transitivity rule to obtain the final reachability matrix shown in <xref ref-type="table" rid="table7">Table 7</xref>.</p>
        <p>The next step in developing LLMs for medical education involved listing reachability and antecedent sets for each enabler, followed by level partitioning, which is an iterative process of assigning enablers at different levels. Enablers whose intersection set is identical to their reachability set are placed at the top level. The process is then repeated until levels are established for all enablers. In this study, all enablers were assigned after three iterations; hence, there are three levels in the hierarchy. The summary of level partitioning is provided in <xref ref-type="table" rid="table8">Table 8</xref>. The level of an enabler is a reflection of its driving power and dependence power, as indicated in <xref ref-type="table" rid="table7">Table 7</xref>. The higher the level of the enabler, the more dependent it is, whereas the driving ability improves when moving to lower levels.</p>
        <p>Once the level partitioning was complete, the TISM was developed and presented to the focus group for validation. Only significant transitive links were included in the model to facilitate interpretation. The final digraph for the TISM developed in the study is depicted in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Structural self-interaction matrix for the identified enablers of large language models for medical education.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="80"/>
            <col width="110"/>
            <col width="120"/>
            <col width="110"/>
            <col width="160"/>
            <col width="150"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td>Enablers</td>
                <td>Cost (E1)</td>
                <td>Usability (E2)</td>
                <td>Credibility (E3)</td>
                <td>Fairness (E4)</td>
                <td>Accountability (E5)</td>
                <td>Transparency (E6)</td>
                <td>Explainability (E7)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>E1</td>
                <td>Y<sup>a</sup></td>
                <td>Y</td>
                <td>N<sup>b</sup></td>
                <td>N</td>
                <td>N</td>
                <td>Y</td>
                <td>N</td>
              </tr>
              <tr valign="top">
                <td>E2</td>
                <td>Y</td>
                <td>Y</td>
                <td>N</td>
                <td>N</td>
                <td>N</td>
                <td>Y</td>
                <td>Y</td>
              </tr>
              <tr valign="top">
                <td>E3</td>
                <td>N</td>
                <td>N</td>
                <td>Y</td>
                <td>Y</td>
                <td>Y</td>
                <td>N</td>
                <td>N</td>
              </tr>
              <tr valign="top">
                <td>E4</td>
                <td>N</td>
                <td>N</td>
                <td>Y</td>
                <td>Y</td>
                <td>N</td>
                <td>N</td>
                <td>N</td>
              </tr>
              <tr valign="top">
                <td>E5</td>
                <td>N</td>
                <td>N</td>
                <td>Y</td>
                <td>N</td>
                <td>Y</td>
                <td>N</td>
                <td>N</td>
              </tr>
              <tr valign="top">
                <td>E6</td>
                <td>Y</td>
                <td>Y</td>
                <td>N</td>
                <td>N</td>
                <td>N</td>
                <td>Y</td>
                <td>Y</td>
              </tr>
              <tr valign="top">
                <td>E7</td>
                <td>N</td>
                <td>Y</td>
                <td>N</td>
                <td>N</td>
                <td>N</td>
                <td>Y</td>
                <td>Y</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>Y: existence of a relationship between two enablers.</p>
            </fn>
            <fn id="table6fn2">
              <p><sup>b</sup>N: no relationship exists between two enablers.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Final reachability matrix of the enablers for developing large language models in medical education.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="160"/>
            <col width="80"/>
            <col width="80"/>
            <col width="90"/>
            <col width="80"/>
            <col width="150"/>
            <col width="110"/>
            <col width="110"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td>Enablers</td>
                <td>Cost (E1)</td>
                <td>Usability (E2)</td>
                <td>Credibility (E3)</td>
                <td>Fairness (E4)</td>
                <td>Accountability (E5)</td>
                <td>Transparency (E6)</td>
                <td>Explainability (E7)</td>
                <td>Driving power</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>E1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>4</td>
              </tr>
              <tr valign="top">
                <td>E2</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>4</td>
              </tr>
              <tr valign="top">
                <td>E3</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>E4</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>2</td>
              </tr>
              <tr valign="top">
                <td>E5</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>2</td>
              </tr>
              <tr valign="top">
                <td>E6</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>4</td>
              </tr>
              <tr valign="top">
                <td>E7</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>Dependence power</td>
                <td>3</td>
                <td>4</td>
                <td>3</td>
                <td>2</td>
                <td>2</td>
                <td>4</td>
                <td>4</td>
                <td>Not applicable</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table8">
          <label>Table 8</label>
          <caption>
            <p>Summary of level partitioning iterations (1 to 6).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="200"/>
            <col width="190"/>
            <col width="190"/>
            <col width="240"/>
            <col width="180"/>
            <thead>
              <tr valign="top">
                <td>Enablers, (Mi)</td>
                <td>Reachability set, R(Mi)</td>
                <td>Antecedent set, A(Ni)</td>
                <td>Intersection set, R(Mi)∩A(Ni)</td>
                <td>Level</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>III</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>1, 2, 6, 7</td>
                <td>1, 2, 6, 7</td>
                <td>1, 2, 6, 7</td>
                <td>I</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>3, 4, 5</td>
                <td>3, 4, 5</td>
                <td>3, 4, 5</td>
                <td>I</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>3, 4</td>
                <td>3, 4</td>
                <td>3, 4</td>
                <td>I</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>3, 5</td>
                <td>3, 5</td>
                <td>3, 5</td>
                <td>I</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>1, 2, 6, 7</td>
                <td>1, 2, 6, 7</td>
                <td>1, 2, 6, 7</td>
                <td>I</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>7</td>
                <td>1, 7</td>
                <td>7</td>
                <td>II</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Digraph of the total interpretive structural model for the development of large language models in medical education.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e51834_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Validation Analysis</title>
        <p>We further used MICMAC analysis to validate the study findings and derive conclusions. MICMAC analysis involves the development of a graph that classifies enablers based on their driving and dependence power. As shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>, the first quadrant contains autonomous enablers E3 (Credibility), E4 (Fairness), and E5 (Accountability), indicating that the variables falling in this quadrant have low driving and dependence powers. The two enablers falling in the grey region between the third (linkage) and fourth (independent) quadrants are E2 (Usability) and E6 (Transparency), which have medium driving and dependence powers. Similarly, E7 (Explainability) falls in the grey region between the first (autonomous) and second (dependent) quadrants. Finally, E1 (Cost) falls under the fourth (independent) quadrant.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Cross-impact matrix-based multiplication applied to a classification (MICMAC) analysis for enablers of a large language model in medical education. I-IV indicate different levels of the enablers E1-E7. E1: cost; E2: usability; E3: credibility; E4: fairness; E5: accountability; E6: transparency; E7: explainability.</p>
          </caption>
          <graphic xlink:href="ai_v3i1e51834_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The results of the AHP suggested that credibility, followed by accountability, are the foremost enablers for effective LLMs in medical education. The extant literature supports this finding by highlighting the relevance of the source of information based on which the response was generated [<xref ref-type="bibr" rid="ref39">39</xref>]. Similarly, the importance of defining accountability has been emphasized in the recent literature. For example, Tan et al [<xref ref-type="bibr" rid="ref40">40</xref>] advocate for accountability as an important factor in increasing the adoption of LLMs in medical education, training, and practice. The next most important factors to consider are ethical issues such as fairness and cost. LLMs have been criticized for bias against gender or ethnic groups [<xref ref-type="bibr" rid="ref17">17</xref>]. These problems need to be addressed to make LLMs effective in medical education. Moreover, training LLMs on billions of parameters is demanding; thus, only technology giants will launch these LLMs [<xref ref-type="bibr" rid="ref41">41</xref>]. Governments should therefore ensure that the cost of using these LLMs does not become prohibitive for end users, who may resort to insufficient solutions that could ultimately affect the safety of patients.</p>
        <p>In contrast to existing studies, transparency and explainability ranked fifth and sixth in importance in our analysis [<xref ref-type="bibr" rid="ref40">40</xref>]. Many best practices related to health technology suggest that models should use explainable AI in medical devices [<xref ref-type="bibr" rid="ref17">17</xref>]. The low priority of these enablers identified in this study indicates that the end user is unaware of the criticality of these factors; thus, health care professionals need to be educated about these issues as they are not technology savvy [<xref ref-type="bibr" rid="ref42">42</xref>]. Governments should also establish guidelines for the approval of Software as a Medical Device so that these enablers are taken care of at the product development stage. Finally, the focus group indicated that usability is the least important factor among the seven enablers discussed. Although general-purpose LLMs such as ChatGPT are less cluttered, their performance is input-dependent. Improving the prompt use of the recommendation system can enhance the usability and accuracy of LLMs in medical education [<xref ref-type="bibr" rid="ref43">43</xref>]. The expert group advised that the LLMs will improve on these factors with time.</p>
        <p>The results from TISM suggested a slight difference in the perspective of product developers and end users, as the experts gave equal importance to the enablers credibility, fairness, accountability, transparency, and explainability. These results are consistent with extant literature published in peer-reviewed journals [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>], as these are all features related to model development and training.</p>
        <p>In contrast to earlier studies, the product developers and technology experts placed less significance on usability as an enabler, which was given a medium level [<xref ref-type="bibr" rid="ref43">43</xref>]. Thus, the finding of the TISM validates the results of the AHP. The only difference was that cost was considered as the least important enabler for product developers. However, a recent study indicated that economic and environmental costs are significant factors in developing general-purpose LLMs [<xref ref-type="bibr" rid="ref44">44</xref>].</p>
        <p>Successful LLM development involves a complex interplay among technical innovation, regulatory compliance, production costs, and end-user needs. The aim should be to develop products that excel in functionality and positively impact the lives of those who rely on them without causing financial hardship. Thus, this study calls for collaboration between product developers, original equipment manufacturers, regulators, and other stakeholders to find solutions that align with technological advancements and societal expectations for affordability and accessibility.</p>
        <p>Finally, the findings of this study were validated using MICMAC analysis, creating a graph that categorizes enablers based on their driving power and dependence power. In this graph, the enablers credibility, fairness, and accountability are in the first quadrant (autonomous) with low power, indicating that these variables are relatively independent and have limited influence on other variables. Usability and transparency are in the grey region between the third (linkage) and fourth (independent) quadrants with medium power, indicating that they have a moderate influence on other variables and are similarly influenced by them. Explainability falls in the grey region between the first (autonomous) and second (dependent) quadrants, also indicating a medium influence on other variables and a similar degree of influence from them. Finally, cost falls under the fourth quadrant (independent), suggesting that it strongly influences other enablers without being significantly influenced by them. MICMAC analysis comprehensively explains the relationships and dynamics among variables within a complex system. This can help decision makers identify key drivers, dependencies, and interactions, enabling them to make informed strategic decisions and allocate resources effectively.</p>
      </sec>
      <sec>
        <title>Practical and Theoretical Implications</title>
        <p>The study has one implication each for theory and for practice. For theory, this study extends the Fairness, Accountability, Transparency, and Explainability (FATE) framework [<xref ref-type="bibr" rid="ref45">45</xref>] into a more comprehensive Cost, Usability, Credibility, Fairness, Accountability, Transparency, and Explainability (CUC-FATE) framework for developing LLMs for health care professionals. With respect to the implication for practice, this study is the first of its kind and provides a prescriptive framework for developing LLMs in health care, especially medical education. The findings of this study are useful for policy makers, medical device regulators, education policy makers, health care professionals, and product developers at the helm of creating Software as a Medical Device.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>One of the limitations of the study is that the results largely rely on experts from India and the United Arab Emirates. Although technology and health care practices are standardized globally, the findings should only be generalized to the populations from these regions. This study provides insight into the relationships between different enablers but we did not further evaluate the strength of these associations. Graph theory or structural equation modeling can be used to address these gaps in future studies.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>This study emphasizes key factors for effective LLMs in medical education: credibility and accountability are vital enablers, while addressing bias and cost is crucial for enhancing LLM potential. Although important, transparency and explainability rank lower as LLM enablers among health professionals, suggesting a need for further education on this technology. Usability emerged as the least important factor; however, enhancing prompt use improves LLM accuracy. This study highlights a slight difference between product developers and end users. Although both groups prioritize credibility, fairness, accountability, transparency, and explainability, usability ranks lower for developers. Successful LLM development must balance innovation, compliance, costs, and user needs. Collaboration among stakeholders is crucial for aligning with technology and societal expectations.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AHP</term>
          <def>
            <p>analytical hierarchy process</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CI</term>
          <def>
            <p>consistency index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CR</term>
          <def>
            <p>consistency ratio</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">CUC-FATE</term>
          <def>
            <p>Cost, Usability, Credibility, Fairness, Accountability, Transparency, and Explainability</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">FATE</term>
          <def>
            <p>Fairness, Accountability, Transparency, and Explainability</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">MICMAC</term>
          <def>
            <p>cross-impact matrix multiplication applied to classification</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">RI</term>
          <def>
            <p>random index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">TISM</term>
          <def>
            <p>total interpretive structural modeling</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors are highly indebted to all focus group participants for their time and effort. The authors are also obliged to their respective institutions for the infrastructural support provided. The authors disclose using the artificial intelligence tools Grammarly and Quillbot for manuscript language editing. The article processing charges for the publication of the manuscript are funded by the College of Business Administration, Kuwait University.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The necessary data and calculations for the analytic hierarchy process model and the self-interaction matrix for the total interpretive structural model are available on a GitHub repository [<xref ref-type="bibr" rid="ref46">46</xref>].</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>Conceptualization: VM, MQ, S Madakam, YL, and S Mark; Data curation: VM and S Madakam; Formal Analysis: VM, YL, and S Mark; Funding acquisition: MQ; Methodology: VM and MQ; Project administration: MQ; Supervision: YL and S Mark; Validation: YL and S Mark; Visualization: VM; Writing – original draft: VM and MQ; Writing – review &#38; editing: YL and S Mark.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haque</surname>
              <given-names>MUI</given-names>
            </name>
            <name name-style="western">
              <surname>Dharmadasa</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sworna</surname>
              <given-names>ZT</given-names>
            </name>
            <name name-style="western">
              <surname>Rajapakse</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmad</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>"I think this is the most disruptive technology": exploring sentiments of ChatGPT early adopters using Twitter data</article-title>
          <source>arXiv</source>
          <year>2022</year>
          <access-date>2023-12-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2212.05856">https://arxiv.org/abs/2212.05856</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nastasi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Courtright</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Weissman</surname>
              <given-names>GE</given-names>
            </name>
          </person-group>
          <article-title>A vignette-based evaluation of ChatGPT's ability to provide appropriate and equitable medical advice across care contexts</article-title>
          <source>Sci Rep</source>
          <year>2023</year>
          <month>10</month>
          <day>19</day>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>17885</fpage>
          <pub-id pub-id-type="doi">10.1038/s41598-023-45223-y</pub-id>
          <pub-id pub-id-type="medline">37857839</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-023-45223-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC10587094</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Qiang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Summary of ChatGPT-related research and perspective towards the future of large language models</article-title>
          <source>Meta-Radiology</source>
          <year>2023</year>
          <month>09</month>
          <volume>1</volume>
          <issue>2</issue>
          <fpage>100017</fpage>
          <pub-id pub-id-type="doi">10.1016/j.metrad.2023.100017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hagendorff</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Machine psychology: investigating emergent capabilities and behavior in large language models using psychological methods</article-title>
          <source>arXiv</source>
          <year>2023</year>
          <month>03</month>
          <access-date>2023-12-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2303.13988">https://arxiv.org/abs/2303.13988</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Májovský</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Černý</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kasal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Komarc</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Netuka</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence can generate fraudulent but authentic-looking scientific medical articles: Pandora's box has been opened</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>05</month>
          <day>31</day>
          <volume>25</volume>
          <fpage>e46924</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023/1/e46924/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/46924</pub-id>
          <pub-id pub-id-type="medline">37256685</pub-id>
          <pub-id pub-id-type="pii">v25i1e46924</pub-id>
          <pub-id pub-id-type="pmcid">PMC10267787</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mann</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ryder</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Subbiah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kaplan</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Dhariwal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Neelakantan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shyam</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sastry</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Askell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Herbert-Voss</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Krueger</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Henighan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Child</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ramesh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ziegler</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Winter</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hesse</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sigler</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Litwin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chess</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Berner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>McCandlish</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Radford</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Amodei</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Language models are few-shot learners</article-title>
          <year>2020</year>
          <conf-name>NIPS'20: 34th International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>December 6-12, 2020</conf-date>
          <conf-loc>Vancouver, BC</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>May</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bordia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bowman</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Rudinger</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>On measuring social biases in sentence encoders</article-title>
          <source>arXiv</source>
          <year>2019</year>
          <access-date>2023-12-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1903.10561">https://arxiv.org/abs/1903.10561</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>August</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Bragg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hearst</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Head</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lo</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Paper plain: Making medical research papers approachable to healthcare consumers with natural language processing</article-title>
          <source>ACM Trans Comput Hum Interact</source>
          <year>2023</year>
          <month>09</month>
          <day>23</day>
          <volume>30</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <lpage>38</lpage>
          <pub-id pub-id-type="doi">10.1145/3589955</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaelin</surname>
              <given-names>VC</given-names>
            </name>
            <name name-style="western">
              <surname>Valizadeh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Salgado</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Parde</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Khetani</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in rehabilitation targeting the participation of children and youth with disabilities: scoping review</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>11</month>
          <day>04</day>
          <volume>23</volume>
          <issue>11</issue>
          <fpage>e25745</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/11/e25745/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/25745</pub-id>
          <pub-id pub-id-type="medline">34734833</pub-id>
          <pub-id pub-id-type="pii">v23i11e25745</pub-id>
          <pub-id pub-id-type="pmcid">PMC8603165</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Iroju</surname>
              <given-names>OG</given-names>
            </name>
            <name name-style="western">
              <surname>Olaleke</surname>
              <given-names>JO</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of natural language processing in healthcare</article-title>
          <source>Int J Inf Technol Comput Sci</source>
          <year>2015</year>
          <month>07</month>
          <day>08</day>
          <volume>7</volume>
          <issue>8</issue>
          <fpage>44</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mecs-press.org/ijitcs/ijitcs-v7-n8/IJITCS-V7-N8-7.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.5815/ijitcs.2015.08.07</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lavanya</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sasikala</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Deep learning techniques on text classification using natural language processing (NLP) in social healthcare network: a comprehensive survey</article-title>
          <year>2021</year>
          <conf-name>3rd International Conference on Signal Processing and Communication (ICPSC)</conf-name>
          <conf-date>May 13-14, 2021</conf-date>
          <conf-loc>Coimbatore, India</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icspc51351.2021.9451752</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sallam</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT utility in healthcare education, research, and practice: systematic review on the promising perspectives and valid concerns</article-title>
          <source>Healthcare</source>
          <year>2023</year>
          <month>03</month>
          <day>19</day>
          <volume>11</volume>
          <issue>6</issue>
          <fpage>887</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=healthcare11060887"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/healthcare11060887</pub-id>
          <pub-id pub-id-type="medline">36981544</pub-id>
          <pub-id pub-id-type="pii">healthcare11060887</pub-id>
          <pub-id pub-id-type="pmcid">PMC10048148</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Seetharaman</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Revolutionizing medical education: can ChatGPT boost subjective learning and expression?</article-title>
          <source>J Med Syst</source>
          <year>2023</year>
          <month>05</month>
          <day>09</day>
          <volume>47</volume>
          <issue>1</issue>
          <fpage>61</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-023-01957-w</pub-id>
          <pub-id pub-id-type="medline">37160568</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-023-01957-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grabb</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT in medical education: a paradigm shift or a dangerous tool?</article-title>
          <source>Acad Psychiatry</source>
          <year>2023</year>
          <month>08</month>
          <volume>47</volume>
          <issue>4</issue>
          <fpage>439</fpage>
          <lpage>440</lpage>
          <pub-id pub-id-type="doi">10.1007/s40596-023-01791-9</pub-id>
          <pub-id pub-id-type="medline">37160840</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40596-023-01791-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kleebayoon</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wiwanitkit</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT in medical practice, education and research: malpractice and plagiarism</article-title>
          <source>Clin Med</source>
          <year>2023</year>
          <month>05</month>
          <volume>23</volume>
          <issue>3</issue>
          <fpage>280</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.rcpjournals.org/lookup/pmid/37236804"/>
          </comment>
          <pub-id pub-id-type="doi">10.7861/clinmed.Let.23.3.2</pub-id>
          <pub-id pub-id-type="medline">37236804</pub-id>
          <pub-id pub-id-type="pii">23/3/280-a</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Utility of ChatGPT in clinical practice</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>06</month>
          <day>28</day>
          <volume>25</volume>
          <fpage>e48568</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023/1/e48568/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48568</pub-id>
          <pub-id pub-id-type="medline">37379067</pub-id>
          <pub-id pub-id-type="pii">v25i1e48568</pub-id>
          <pub-id pub-id-type="pmcid">PMC10365580</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>PP</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT: a comprehensive review on background, applications, key challenges, bias, ethics, limitations and future scope</article-title>
          <source>Internet of Things Cyber-Physical Syst</source>
          <year>2023</year>
          <volume>3</volume>
          <fpage>121</fpage>
          <lpage>154</lpage>
          <pub-id pub-id-type="doi">10.1016/j.iotcps.2023.04.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Milano</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McGrane</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Leonelli</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Large language models challenge the future of higher education</article-title>
          <source>Nat Mach Intell</source>
          <year>2023</year>
          <month>03</month>
          <day>31</day>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>333</fpage>
          <lpage>334</lpage>
          <pub-id pub-id-type="doi">10.1038/s42256-023-00644-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ran</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Deep learning with edge computing: a review</article-title>
          <source>Proc IEEE</source>
          <year>2019</year>
          <month>08</month>
          <volume>107</volume>
          <issue>8</issue>
          <fpage>1655</fpage>
          <lpage>1674</lpage>
          <pub-id pub-id-type="doi">10.1109/jproc.2019.2921977</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bharany</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khalaf</surname>
              <given-names>OI</given-names>
            </name>
            <name name-style="western">
              <surname>Abdulsahib</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Al Humaimeedy</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Aldhyani</surname>
              <given-names>THH</given-names>
            </name>
            <name name-style="western">
              <surname>Maashi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alkahtani</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A systematic survey on energy-efficient techniques in sustainable cloud computing</article-title>
          <source>Sustainability</source>
          <year>2022</year>
          <month>05</month>
          <day>20</day>
          <volume>14</volume>
          <issue>10</issue>
          <fpage>6256</fpage>
          <pub-id pub-id-type="doi">10.3390/su14106256</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Potrebny</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Larun</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ciliska</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Olsen</surname>
              <given-names>NR</given-names>
            </name>
          </person-group>
          <article-title>Usability methods and attributes reported in usability studies of mobile apps for health care education: scoping review</article-title>
          <source>JMIR Med Educ</source>
          <year>2022</year>
          <month>06</month>
          <day>29</day>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>e38259</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2022/2/e38259/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/38259</pub-id>
          <pub-id pub-id-type="medline">35767323</pub-id>
          <pub-id pub-id-type="pii">v8i2e38259</pub-id>
          <pub-id pub-id-type="pmcid">PMC9280458</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Usability research in educational technology: a state-of-the-art systematic review</article-title>
          <source>Educ Technol Res Dev</source>
          <year>2022</year>
          <month>08</month>
          <day>22</day>
          <volume>70</volume>
          <issue>6</issue>
          <fpage>1951</fpage>
          <lpage>1992</lpage>
          <pub-id pub-id-type="doi">10.1007/s11423-022-10152-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hein</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Glombiewski</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Rief</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Riecke</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Effects of a video intervention on physicians' acceptance of pain apps: a randomised controlled trial</article-title>
          <source>BMJ Open</source>
          <year>2022</year>
          <month>04</month>
          <day>25</day>
          <volume>12</volume>
          <issue>4</issue>
          <fpage>e060020</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=35470200"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2021-060020</pub-id>
          <pub-id pub-id-type="medline">35470200</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2021-060020</pub-id>
          <pub-id pub-id-type="pmcid">PMC9039411</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Skalidis</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Muller</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Fournier</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>CardioVerse: the cardiovascular medicine in the era of Metaverse</article-title>
          <source>Trends Cardiovasc Med</source>
          <year>2023</year>
          <month>11</month>
          <volume>33</volume>
          <issue>8</issue>
          <fpage>471</fpage>
          <lpage>476</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1050-1738(22)00071-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.tcm.2022.05.004</pub-id>
          <pub-id pub-id-type="medline">35568263</pub-id>
          <pub-id pub-id-type="pii">S1050-1738(22)00071-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lund</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Chatting about ChatGPT: how may AI and GPT impact academia and libraries?</article-title>
          <source>Library High Tech News</source>
          <year>2023</year>
          <month>02</month>
          <day>14</day>
          <volume>40</volume>
          <issue>3</issue>
          <fpage>26</fpage>
          <lpage>29</lpage>
          <pub-id pub-id-type="doi">10.1108/lhtn-01-2023-0009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Fairness-guided few-shot prompting for large language models</article-title>
          <source>arXiv</source>
          <year>2023</year>
          <month>03</month>
          <access-date>2023-12-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2303.13217">https://arxiv.org/abs/2303.13217</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hébert</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>MacDonald</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Flegel</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Stanbrook</surname>
              <given-names>MB</given-names>
            </name>
          </person-group>
          <article-title>Competing interests and undergraduate medical education: time for transparency</article-title>
          <source>CMAJ</source>
          <year>2010</year>
          <month>09</month>
          <day>07</day>
          <volume>182</volume>
          <issue>12</issue>
          <fpage>1279</fpage>
          <lpage>1279</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.cmaj.ca/cgi/pmidlookup?view=long&#38;pmid=20457768"/>
          </comment>
          <pub-id pub-id-type="doi">10.1503/cmaj.100605</pub-id>
          <pub-id pub-id-type="medline">20457768</pub-id>
          <pub-id pub-id-type="pii">cmaj.100605</pub-id>
          <pub-id pub-id-type="pmcid">PMC2934787</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Merrill</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Beltagy</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Transparency helps reveal when language models learn meaning</article-title>
          <source>Trans Assoc Comput Ling</source>
          <year>2023</year>
          <volume>11</volume>
          <fpage>617</fpage>
          <lpage>634</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2023.tacl-1.36.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.1162/tacl_a_00565</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Susnjak</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Beyond predictive learning analytics modelling and onto explainable artificial intelligence with prescriptive analytics and ChatGPT</article-title>
          <source>Int J Artif Intell Educ</source>
          <year>2023</year>
          <month>06</month>
          <day>22</day>
          <fpage>1</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/article/10.1007/s40593-023-00336-3#citeas"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40593-023-00336-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Du</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Shortcut learning of large language models in natural language understanding</article-title>
          <source>Commun ACM</source>
          <year>2023</year>
          <month>12</month>
          <day>21</day>
          <volume>67</volume>
          <issue>1</issue>
          <fpage>110</fpage>
          <lpage>120</lpage>
          <pub-id pub-id-type="doi">10.1145/3596490</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Health technology assessment of telemedicine interventions in diabetes management: evidence from UAE</article-title>
          <source>FIIB Bus Rev</source>
          <year>2022</year>
          <month>11</month>
          <day>29</day>
          <fpage>231971452211306</fpage>
          <pub-id pub-id-type="doi">10.1177/23197145221130651</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dua</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Kulkarni</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>Modelling perceived risk in blockchain enabled supply chain utilizing fuzzy-AHP</article-title>
          <source>J Glob Oper Strateg Sourc</source>
          <year>2022</year>
          <month>08</month>
          <day>10</day>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>161</fpage>
          <lpage>177</lpage>
          <pub-id pub-id-type="doi">10.1108/jgoss-06-2021-0046</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Rana</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Understanding barriers to inbound medical tourism in the United Arab Emirates from a provider's perspective</article-title>
          <source>Worldw Hosp Tour Themes</source>
          <year>2022</year>
          <month>11</month>
          <day>30</day>
          <volume>15</volume>
          <issue>2</issue>
          <fpage>131</fpage>
          <lpage>142</lpage>
          <pub-id pub-id-type="doi">10.1108/whatt-10-2022-0122</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Estimating relative immediacy of water-related challenges in Small Island Developing States (SIDS) of the Pacific Ocean using AHP modeling</article-title>
          <source>Model Earth Syst Environ</source>
          <year>2019</year>
          <month>11</month>
          <day>02</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>201</fpage>
          <lpage>214</lpage>
          <pub-id pub-id-type="doi">10.1007/s40808-019-00671-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Groenland</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <source>Qualitative methodologies and data collection methods: toward increased rigour in management research</source>
          <year>2019</year>
          <publisher-loc>Singapore</publisher-loc>
          <publisher-name>World Scientific</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>Sushil</collab>
          </person-group>
          <article-title>Interpreting the interpretive structural model</article-title>
          <source>Glob J Flex Syst Manag</source>
          <year>2012</year>
          <month>9</month>
          <day>18</day>
          <volume>13</volume>
          <issue>2</issue>
          <fpage>87</fpage>
          <lpage>106</lpage>
          <pub-id pub-id-type="doi">10.1007/s40171-012-0008-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prasad</surname>
              <given-names>UC</given-names>
            </name>
            <name name-style="western">
              <surname>Suri</surname>
              <given-names>RK</given-names>
            </name>
          </person-group>
          <article-title>Modeling of continuity and change forces in private higher technical education using total interpretive structural modeling (TISM)</article-title>
          <source>Glob J Flex Syst Manag</source>
          <year>2017</year>
          <month>10</month>
          <day>4</day>
          <volume>12</volume>
          <issue>3-4</issue>
          <fpage>31</fpage>
          <lpage>39</lpage>
          <pub-id pub-id-type="doi">10.1007/bf03396605</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cacciamani</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Eppler</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Ganjavi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pekan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Biedermann</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Gill</surname>
              <given-names>IS</given-names>
            </name>
          </person-group>
          <article-title>Development of the ChatGPT, generative artificial intelligence and natural large language models for accountable reporting and use (CANGARU) guidelines</article-title>
          <source>arXiv</source>
          <year>2023</year>
          <month>07</month>
          <access-date>2023-12-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2307.08974">https://arxiv.org/abs/2307.08974</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jamal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Solaiman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alhasan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Temsah</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Sayed</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Integrating ChatGPT in medical education: adapting curricula to cultivate competent physicians for the AI era</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <month>08</month>
          <volume>15</volume>
          <issue>8</issue>
          <fpage>e43036</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37674966"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.43036</pub-id>
          <pub-id pub-id-type="medline">37674966</pub-id>
          <pub-id pub-id-type="pmcid">PMC10479954</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>LF</given-names>
            </name>
            <name name-style="western">
              <surname>Heng</surname>
              <given-names>JJY</given-names>
            </name>
            <name name-style="western">
              <surname>Teo</surname>
              <given-names>DB</given-names>
            </name>
          </person-group>
          <article-title>Response to: "The next paradigm shift? ChatGPT, artificial intelligence, and medical education"</article-title>
          <source>Med Teach</source>
          <year>2023</year>
          <month>09</month>
          <day>13</day>
          <volume>46</volume>
          <issue>1</issue>
          <fpage>151</fpage>
          <lpage>152</lpage>
          <pub-id pub-id-type="doi">10.1080/0142159x.2023.2256961</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rudolph</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>War of the chatbots: Bard, Bing Chat, ChatGPT, Ernie and beyond. The new AI gold rush and its impact on higher education</article-title>
          <source>J Appl Learn Teach</source>
          <year>2023</year>
          <month>4</month>
          <day>25</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>364</fpage>
          <lpage>389</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sfu.ca/jalt/index.php/jalt/article/view/771"/>
          </comment>
          <pub-id pub-id-type="doi">10.37074/jalt.2023.6.1.23</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baslom</surname>
              <given-names>MMM</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Strategic management of organizational knowledge and employee's awareness about artificial intelligence with mediating effect of learning climate</article-title>
          <source>Int J Comput Intell Syst</source>
          <year>2019</year>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>1585</fpage>
          <pub-id pub-id-type="doi">10.2991/ijcis.d.191025.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kamineni</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lie</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Prasad</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Landman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dreyer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Succi</surname>
              <given-names>MD</given-names>
            </name>
          </person-group>
          <article-title>Assessing the utility of ChatGPT throughout the entire clinical workflow: development and usability study</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>08</month>
          <day>22</day>
          <volume>25</volume>
          <fpage>e48659</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023/1/e48659/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48659</pub-id>
          <pub-id pub-id-type="medline">37606976</pub-id>
          <pub-id pub-id-type="pii">v25i1e48659</pub-id>
          <pub-id pub-id-type="pmcid">PMC10481210</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Krishna</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Awadallah</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>EcoAssistant: using LLM Assistant more affordably and accurately</article-title>
          <source>arXiv</source>
          <year>2023</year>
          <access-date>2023-12-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2310.03046">https://arxiv.org/abs/2310.03046</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Memarian</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Doleck</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Fairness, Accountability, Transparency, and Ethics (FATE) in artificial intelligence (AI) and higher education: a systematic review</article-title>
          <source>Comput Educ Artific Intell</source>
          <year>2023</year>
          <volume>5</volume>
          <fpage>100152</fpage>
          <pub-id pub-id-type="doi">10.1016/j.caeai.2023.100152</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Data for AHP and TISM models for the CUC-FATE framework</article-title>
          <source>GitHub</source>
          <access-date>2023-12-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/vinaytosh/datasharing/blob/master/Data_CUCFATE.xlsx">https://github.com/vinaytosh/datasharing/blob/master/Data_CUCFATE.xlsx</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
