<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="review-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Educ</journal-id><journal-id journal-id-type="publisher-id">mededu</journal-id><journal-id journal-id-type="index">20</journal-id><journal-title>JMIR Medical Education</journal-title><abbrev-journal-title>JMIR Med Educ</abbrev-journal-title><issn pub-type="epub">2369-3762</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v11i1e71125</article-id><article-id pub-id-type="doi">10.2196/71125</article-id><article-categories><subj-group subj-group-type="heading"><subject>Review</subject></subj-group></article-categories><title-group><article-title>Applications, Challenges, and Prospects of Generative Artificial Intelligence Empowering Medical Education: Scoping Review</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Lin</surname><given-names>Yuhang</given-names></name><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Luo</surname><given-names>Zhiheng</given-names></name><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ye</surname><given-names>Zicheng</given-names></name><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhong</surname><given-names>Nuoxi</given-names></name><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhao</surname><given-names>Lijian</given-names></name><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Long</given-names></name><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Li</surname><given-names>Xiaolan</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chen</surname><given-names>Zetao</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Chen</surname><given-names>Yijia</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Guangdong Provincial Key Laboratory of Stomatology, Hospital of Stomatology, Guanghua School of Stomatology, Sun Yat-sen University</institution><addr-line>No. 56, Lingyuan Road West</addr-line><addr-line>Guangzhou</addr-line><country>China</country></aff><aff id="aff2"><institution>Zhongshan School of Medicine, Sun Yat-sen University</institution><addr-line>Guangzhou</addr-line><country>China</country></aff><aff id="aff3"><institution>School of Government, Sun Yat-sen University</institution><addr-line>Guangzhou</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Lesselroth</surname><given-names>Blake</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Mesk&#x00F3;</surname><given-names>Bertalan</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Wang</surname><given-names>Changyu</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Hang</surname><given-names>Ching Nam</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Zhu</surname><given-names>Lingxuan</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Yin</surname><given-names>Rong</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Yijia Chen, PhD, Guangdong Provincial Key Laboratory of Stomatology, Hospital of Stomatology, Guanghua School of Stomatology, Sun Yat-sen University, No. 56, Lingyuan Road West, Guangzhou, 510055, China, 86 13580591020; <email>chenyij9@mail.sysu.edu.cn</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>23</day><month>10</month><year>2025</year></pub-date><volume>11</volume><elocation-id>e71125</elocation-id><history><date date-type="received"><day>10</day><month>01</month><year>2025</year></date><date date-type="rev-recd"><day>26</day><month>07</month><year>2025</year></date><date date-type="accepted"><day>23</day><month>09</month><year>2025</year></date></history><copyright-statement>&#x00A9; Yuhang Lin, Zhiheng Luo, Zicheng Ye, Nuoxi Zhong, Lijian Zhao, Long Zhang, Xiaolan Li, Zetao Chen, Yijia Chen. Originally published in JMIR Medical Education (<ext-link ext-link-type="uri" xlink:href="https://mededu.jmir.org">https://mededu.jmir.org</ext-link>), 23.10.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Education, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://mededu.jmir.org/">https://mededu.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://mededu.jmir.org/2025/1/e71125"/><abstract><sec><title>Background</title><p>Nowadays, generative artificial intelligence (GAI) drives medical education toward enhanced intelligence, personalization, and interactivity. With its vast generative abilities and diverse applications, GAI redefines how educational resources are accessed, teaching methods are implemented, and assessments are conducted.</p></sec><sec><title>Objective</title><p>This study aimed to review the current applications of GAI in medical education; analyze its opportunities and challenges; identify its strengths and potential issues in educational methods, assessments, and resources; and capture GAI&#x2019;s rapid evolution and multidimensional applications in medical education, thereby providing a theoretical foundation for future practice.</p></sec><sec sec-type="methods"><title>Methods</title><p>This scoping review used PubMed, Web of Science, and Scopus to analyze literature from January 2023 to October 2024, focusing on GAI applications in medical education. Following PRISMA-ScR (Preferred Reporting Items for Systematic Reviews and Meta-Analyses Extension for Scoping Reviews) guidelines, 5991 articles were retrieved, with 1304 duplicates removed. The 2-stage screening (title or abstract and full-text review) excluded 4564 articles and a supplementary search included 8 articles, yielding 131 studies for final synthesis. We included (1) studies addressing GAI&#x2019;s applications, challenges, or future directions in medical education, (2) empirical research, systematic reviews, and meta-analyses, and (3) English-language articles. We excluded commentaries, editorials, viewpoints, perspectives, short reports, or communications with low levels of evidence, non-GAI technologies, and studies centered on other fields of medical education (eg, nursing). We integrated quantitative analysis of publication trends and Human Development Index (HDI) with thematic analysis of applications, technical limitations, and ethical implications.</p></sec><sec sec-type="results"><title>Results</title><p>Analysis of 131 articles revealed that 74.0% (n=97) originated from countries or regions with very high HDI, with the United States contributing the most (n=33); 14.5% (n=19) were from high HDI countries, 5.3% (n=7) from medium HDI countries, and 2.2% (n=3) from low HDI countries, with 3.8% (n=5) involving cross-HDI collaborations. ChatGPT was the most studied GAI model (n=119), followed by Gemini (n=22), Copilot (n=11), Claude (n=6), and LLaMA (n=4). Thematic analysis indicated that GAI applications in medical education mainly embody the diversification of educational methods, scientific evaluation of educational assessments, and dynamic optimization of educational resources. However, it also highlighted current limitations and potential future challenges, including insufficient scene adaptability, data quality and information bias, overreliance, and ethical controversies.</p></sec><sec sec-type="conclusions"><title>Conclusion</title><p>GAI application in medical education exhibits significant regional disparities in development, and model research statistics reflect researchers&#x2019; certain usage preferences. GAI holds potential for empowering medical education, but widespread adoption requires overcoming complex technical and ethical challenges. Grounded in symbiotic agency theory, we advocate establishing the resource-method-assessment tripartite model, developing specialized models and constructing an integrated system of general large language models incorporating specialized ones, promoting resource sharing, refining ethical governance, and building an educational ecosystem fostering human-machine symbiosis, enabling deep tech-humanism integration and advancing medical education toward greater efficiency and human-centeredness.</p></sec></abstract><kwd-group><kwd>generative artificial intelligence</kwd><kwd>GAI</kwd><kwd>large language model</kwd><kwd>ChatGPT</kwd><kwd>medical education</kwd><kwd>human-machine symbiosis</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>The 21st century has seen accelerated advancement in information technology and artificial intelligence (AI), significantly altering lifestyles and work paradigms. With progress in deep learning and large-scale data processing, generative artificial intelligence (GAI) has emerged as an influential innovation. GAI rapidly expands into diverse applications, enabling content generation across text, images, and audio through the analysis of extensive datasets [<xref ref-type="bibr" rid="ref1">1</xref>]. Its market demonstrates notable growth, with a 2024 global valuation of ~US $16.8 billion and a projected 37.6% compound annual growth rate (CAGR) from 2025 to 2030 [<xref ref-type="bibr" rid="ref2">2</xref>], reflecting its significance in commercial and academic domains.</p><p>GAI&#x2019;s development is driven by advances in natural language processing (NLP), particularly the Transformer architecture, which enables the generation of complex content. Large language models (LLMs) serve as core technical implementations of GAI. Models like GPT-3, GPT-4, Copilot, and LLaMA 3 have expanded GAI applications from basic automation to sophisticated tasks including content creation, data analysis, and intelligent question-answering systems [<xref ref-type="bibr" rid="ref3">3</xref>]. These transformer-based LLMs exemplify how conceptual GAI frameworks are operationalized via model architectures and engineering practices.</p><p>With technological advancements, GAI has gradually infiltrated more specialized fields, with medical education a prime example. This domain faces challenges due to its knowledge-intensive and highly practical characteristics: traditional teaching methods struggle to replicate clinical scenarios efficiently, and increasingly scarce clinical teaching specimens and patient resources limit the clinical practice training of medical students, all of which are not conducive to the cultivation of medical talents with both clinical thinking and practical ability [<xref ref-type="bibr" rid="ref4">4</xref>]. In this content, GAI may empower medical education through its enhancement effects on 3 core educational elements: improving resource generation efficiency, optimizing the interactivity of pedagogical approaches, and enhancing the automation level of assessment processes [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Nevertheless, the accompanying integration risks include potential biases and inaccuracies in generated content [<xref ref-type="bibr" rid="ref7">7</xref>] and possible inhibition of critical thinking through over-reliance [<xref ref-type="bibr" rid="ref8">8</xref>]. Thus, optimal implementation strategies warrant further investigation.</p><p>Current GAI integration in medical education involves rapid technological iteration and shifting research paradigms [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Prior reviews exhibit three limitations: (L1) Overreliance on single-model analyses (predominantly ChatGPT) [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>], (L2) insufficient examination of geographical disparities in adoption patterns, and (L3) fragmented assessment of GAI&#x2019;s impact across 3 core dimensions of medical education. These dimensions include resources (teaching support materials like GAI-generated clinical cases and pathological images), methods (instructional strategies like adaptive learning pathways and simulated decision-making), and assessment (automated evaluation of learner performance, such as automated short-answer scoring). Crucially, studies before 2023 were constrained by the technology&#x2019;s maturity, missing the recent shift from theoretical exploration to operational implementation [<xref ref-type="bibr" rid="ref1">1</xref>]. Therefore, a new round of scoping review is urgently needed to focus on the critical evolution period between January 2023 and October, 2024 (before the completion of this scoping review), construct a multidimensional analytical framework (encompassing resources, methods, and assessment), and clarify the complex picture of the deep interaction between GAI and medical education. To guide this investigation, this study discusses the multifaceted landscape of GAI adoption in medical education through 3 interconnected lines of inquiry. First, it aims to examine whether regional disparities exist in GAI implementation and how researchers exhibit preferences for specific LLMs (eg, ChatGPT). We posit that adoption patterns will demonstrate significant stratification aligned with national development levels and reflect preferential usage of widely accessible general-purpose models. Second, it seeks to map the current state of GAI applications across educational resources, methods, and assessment dimensions. We hypothesize that effectiveness will vary substantially across these domains due to differences in technical implementation requirements and inherent task complexities. Third, it intends to identify current limitations and future challenges, positing that technical deficiencies, including ethical risks such as compromised academic integrity and data hallucinations, will constitute the most significant barriers to sustainable integration.</p></sec><sec id="s1-2"><title>Theoretical Framework</title><sec id="s1-2-1"><title>Theoretical Model: The Theory of Symbiotic Agency</title><p>Based on the theoretical framework of symbiotic agency [<xref ref-type="bibr" rid="ref11">11</xref>], a theory emphasizing interdependent and collaborative relationships between humans and technology, this study conceptualizes human-technology relations as a process of mutual constitution. Technology functions neither as a passive instrument dominated by humans nor as an autonomous replacement for human agency. Instead, it develops in tandem with humans through interdependent interactions: technology enhances human efficacy by expanding cognitive boundaries and enabling novel multimodal interactions, while humans legitimize technological practice by embedding ethical norms and conducting context-specific interpretations such as weighting clinical decisions. This symbiosis transcends traditional master-servant dichotomies by establishing a responsibility-sharing network. Within this network, technology acts as a co-agent in human activity systems, collectively enhancing capabilities rather than substituting human roles. This perspective provides the foundational understanding needed to maintain a dynamic balance in human-technology interdependence within medical education, forming the basis of our conceptual model.</p></sec><sec id="s1-2-2"><title>Conceptual Model 1: Specialized Models Integrated System Based on General Large Language Models</title><p>Building upon the analytical framework established in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, which systematically compares general-purpose and domain-specialized GAI models across 3 critical dimensions (knowledge representation fidelity, task compatibility, and ethical constraint mechanisms), this study deconstructs technological heterogeneity to avoid conflating &#x201C;GAI&#x201D; as a homogeneous entity. The models in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> (see Table S1) were selected via multisource evidence synthesis, including peer-reviewed studies, industry reports (eg, Global Large Language Model (LLM) Market Research Report 2024) [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref20">20</xref>], and empirical validation in educational contexts, based on four criteria: (1) technological representativeness of core advancements (multimodality, reasoning, and domain adaptation); (2) broad academic and practical relevance in medical education; (3) functional diversity covering text, image, video, and domain-specific tasks; and (4) market prevalence, wide recognition, technical maturity, and development by prominent AI companies. Notably, models like Perplexity, DeepSeek, Notebook LM, and Midjourney, though used by clinicians and students in specific scenarios, were not included due to limited evaluative data and insufficient supporting information in the referenced reports.</p><p>Within this ecosystem, general LLMs serve as multitasking hubs, leveraging cross-domain adaptability and natural language interaction, while specialized models achieve context-specific efficacy through the embedding of deep medical knowledge. To resolve their complementary yet fragmented coexistence, we propose a specialized model integration system anchored to general LLMs, inspired by symbiotic agency theory and hospital diagnostic workflows [<xref ref-type="bibr" rid="ref21">21</xref>] (see <xref ref-type="fig" rid="figure1">Figure 1</xref>). This architecture establishes a 3-tiered clinical analog: general LLMs serve as primary coordinators, managing task orchestration; specialized models act as domain experts, executing depth-specific processing; and protocol-based collaboration enables online consultation through knowledge distillation and output validation. This hierarchical integration embodies symbiotic agency principles: general models extend the applicability of specialized techniques by transcending domain boundaries, while specialized models enhance system depth by reinforcing medical logical rigor. Through functional complementarity and role differentiation, they form a synergistic symbiont exceeding individual capability limits, establishing an intelligent foundation for medical education characterized by adaptability, expertise, and reliability.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Specialized model integration system based on general large language models.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v11i1e71125_fig01.png"/></fig></sec><sec id="s1-2-3"><title>Conceptual Model 2: Tripartite Synergistic Integration Model for Medical Education Resources, Methods, and Assessment</title><p>The tripartite synergy paradigm, rooted in complex systems management theory and evidenced across domains from political governance to integrated health care systems (eg, the mission alignment model by Peek et al [<xref ref-type="bibr" rid="ref22">22</xref>]), establishes our resource-method-assessment (RMA) framework (see <xref ref-type="fig" rid="figure2">Figure 2</xref>) as the core analytical structure [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. This framework defines three interdependent dimensions: (1) resources encompassing dynamic content provisioning mechanisms, (2) methods designing knowledge-to-practice training pathways, and (3) assessment managing outcome monitoring and feedback generation. Their cyclical optimization forms an integrated whole, as resource renewal enables pedagogical innovation, method implementation yields evaluative data, and assessment outputs drive resource refinement and method calibration. Within this architecture, GAI operates as a collaborative instrument executing content generation, interaction support, and data analysis under educator-directed goal design, ethical governance, and critical intervention. The established framework provides essential categorization criteria for subsequent empirical analysis: it defines 3 dimensions&#x2014;resources, methods, and assessment&#x2014;directly corresponding to 3 primary research domains in GAI applications for medical education. By consolidating fragmented literature within a unified analytical structure, this framework systematically addresses cognitive limitations arising from isolated examinations of technological functions, thereby elucidating the intrinsic operational logic of technology-enabled educational transformation.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>The model of integrated and collaborative development of medical education methods, resources, and assessment.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v11i1e71125_fig02.png"/></fig></sec></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Review</title><p>With the rapid development of GAI, its applications in medical education have garnered considerable attention and have become a significant research focus. We conducted a preliminary search using the keyword combination of &#x201C;generative artificial intelligence&#x201D; and &#x201C;medical education&#x201D; across PubMed, Web of Science, and Scopus. Our goal was to analyze the publication trend regarding the applications and challenges of GAI in medical education over the past 5 years (from January 2020 to October 2024). The literature search was limited to sources published between January 2023 and October 2024 for the following reasons: (1) Technological progression: The 2023&#x2010;2024 period coincides with a shift from theoretical proposals (pre-2023) to empirical studies on GAI implementation in medical education. (2) Scope alignment: The review prioritizes analysis of current applications, identified limitations (eg, output inaccuracies and integrity concerns), and near-future developments rather than historical trends. (3) Avoiding redundancy: Pre-2023 literature is excluded to prevent overlap with existing syntheses and focus on emergent applications (eg, automated assessment and adaptive resources) evidenced in the sampled literature (n=131). (4) Practical relevance: This timeframe reflects consolidated evidence on operational challenges and benefits relevant to contemporary pedagogical decision-making.</p></sec><sec id="s2-2"><title>Search Strategy</title><p>We used Boolean operators to combine GAI and medical education keywords, creating the final search strategy (see <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). A thorough search was conducted across 3 major databases: PubMed, Web of Science, and Scopus, focusing only on English-language articles published from January 2023 to October 2024.</p></sec><sec id="s2-3"><title>Inclusion and Exclusion Criteria</title><p>This study included research articles focusing on the applications, challenges, and future development of GAI in medical education applications. Articles were excluded if they were commentaries, editorials, viewpoint, perspective, and short reports or communications with low level of evidence or did not discuss GAI within medical education. Studies focusing on non-GAI forms such as predictive analytics and natural language processing or those centered on other fields of medical education (eg, nursing) were also excluded. We excluded nursing based on fundamental educational differences. Clinical and dental education follow structured undergraduate curricula focused on acute care, diagnostics, and technical skills within hospital settings. Nursing emphasizes community practice, longitudinal relationships, and chronic disease management [<xref ref-type="bibr" rid="ref24">24</xref>]. Including nursing would introduce significant heterogeneity in learning outcomes, GAI applications, and educational contexts. This methodological exclusion preserves thematic coherence and internal validity for analyzing GAI&#x2019;s role in comparable, technology-driven medical education environments.</p><p>Initially, YL and ZL conducted a preliminary screening of titles and abstracts from 3 databases. With the help of Zotero 7.0.13 (64-bit), a document management software (it is a project of Digital Scholar and developed by a global community), ZL detected duplicates of the initially screened articles according to title, author, abstract, and other information and removed duplicates. Following this initial phase, YL and ZL independently reviewed the full texts for a second round of evaluation. In cases of disagreement, ZY and NZ were consulted to mediate and make the final determination regarding inclusion.</p></sec><sec id="s2-4"><title>Data Extraction Protocol</title><p>To ensure the systematicity, transparency, and reproducibility of this scoping review, a detailed data extraction protocol was developed and rigorously followed.</p><sec id="s2-4-1"><title>Data Point Definition and Protocol Development</title><p>Before comprehensive data extraction, a structured data extraction form was collaboratively developed by all authors. This iterative process was guided by our research questions and the predefined thematic framework outlined in <xref ref-type="table" rid="table1">Table 1</xref>, which focused on the applications, challenges, and prospects of GAI in medical education applications. The form was designed to systematically capture key information from each included article, encompassing: bibliographic details (eg, authors, publication year, journal, and country or region), study characteristics (eg, research design, objectives, and population), specific GAI models used (eg, ChatGPT [OpenAI] and Gemini [Google]), application scope (single-model vs multimodel), analysis type (performance comparison across models or examination of synergistic enhancement through model integration)<bold>,</bold> detailed descriptions of identified applications, challenges, and future directions of GAI application in medical education categorized exclusively through our tripartite Trinity Framework and quantitative performance metrics (reported accuracy rates, percentages, mean scores, standard deviations, and <italic>P</italic> values related to GAI model performance in various tasks). This granular definition of data points ensured that all relevant information pertinent to our broad research inquiry was systematically collected.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>A systematic thematic analysis of applications and challenges of generative artificial intelligence (GAI) in medical education.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Category and theme</td><td align="left" valign="bottom">Subtheme</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="2">Medical educational assessment</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Scoring short answers automatically.</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Evaluating articles.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="2">Medical educational resources</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Providing standard answers.</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>The performance of different question types.</p></list-item><list-item><p>The performance of different difficulty questions.</p></list-item><list-item><p>The performance of questions at different cognitive levels.</p></list-item></list></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Generating diverse clinical cases.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Digital interaction and communication training.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Sharing educational resources.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Generating clinical images.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="2">Medical educational methods</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Curriculum design.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Generating customized teaching aids.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Generating explanations for MCQ<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup>.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Personalized learning support.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Medical decision aid.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Multidisciplinary knowledge acquisition.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Academic writing optimization.</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="2">Existing defects at this stage</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Insufficient scene adaptability.</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Poor ability to handle complex clinical scenarios.</p></list-item><list-item><p>Lack of local background in specific regions.</p></list-item><list-item><p>Language adaptability issues.</p></list-item><list-item><p>Lack of nontextual information analysis skills.</p></list-item></list></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Data quality and information bias</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Hallucination phenomena.</p></list-item><list-item><p>Lack of details on output content.</p></list-item><list-item><p>Lack of personalization.</p></list-item><list-item><p>Dataset dependency.</p></list-item></list></td></tr><tr><td align="left" valign="top" colspan="2">Potential issues in the future</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Overreliance</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Impaired critical thinking.</p></list-item><list-item><p>Decreased creativity.</p></list-item><list-item><p>Decreased teamwork ability.</p></list-item><list-item><p>Decreased practical problem-solving ability.</p></list-item></list></td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Ethical controversy</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Authenticity of the test results.</p></list-item><list-item><p>Academic misconduct.</p></list-item><list-item><p>Lack of clinical interaction and emotional resonance.</p></list-item><list-item><p>Resource inequality.</p></list-item><list-item><p>Ownership of intellectual property rights.</p></list-item><list-item><p>&#x201C;Black box&#x201D; problem and attribution of responsibility.</p></list-item></list></td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>Not available.</p></fn><fn id="table1fn2"><p><sup>b</sup>MCQ: multiple choice question.</p></fn></table-wrap-foot></table-wrap><p>To better understand the global research landscape in this field, we analyzed the countries or regions of origin for the 131 selected articles. For those without a precise location, we assigned them according to the country or region of the corresponding author&#x2019;s institution. To analyze the distribution of research based on the countries or region&#x2019;s development level, we used the Human Development Index (HDI) classification. The latest HDI data categorizes countries or regions into 4 tiers: very high, high, medium, and low human development with higher HDI scores correlating with greater national development. We also investigated cross-level HDI collaborations, which refer to partnerships between countries from different HDI categories [<xref ref-type="bibr" rid="ref25">25</xref>].</p></sec><sec id="s2-4-2"><title>Protocol Testing and Quality Control</title><p>To validate the comprehensiveness and clarity of the data extraction form, a pilot test was independently conducted by 2 reviewers, YL and ZL, on a randomly selected subset of 10 included articles. During this pilot phase, any discrepancies in data extraction or ambiguities within the form were identified and discussed. Based on these discussions, the data extraction form underwent iterative revisions to refine categories, clarify definitions, and ensure consistent interpretation of data points among reviewers. Following this refinement, YL and ZL independently extracted data from all 131 included articles. In cases of disagreement between the 2 independent extractors, consensus was initially sought through discussion. If a consensus could not be reached, a third and fourth reviewer, ZY and NZ, were consulted to mediate and make final determinations regarding the applicability and extraction of the data.</p></sec></sec><sec id="s2-5"><title>Synthesis of Results</title><p>ZY subsequently compiled and reorganized the extracted data, assigning new identifiers for easier reference. This organized dataset was then categorized according to the predefined themes and subthemes (see <xref ref-type="table" rid="table1">Table 1</xref>), forming the basis for the subsequent descriptive summary and analysis. Our analysis employed a theory-driven, top-down approach anchored in a tripartite conceptual model of medical education: resource generation, method innovation, and assessment upgrade. The following sections will present a descriptive summary of the extracted data.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>Following our search strategy, we retrieved 5991 articles, of which 1304 were duplicates, leaving 4687 articles. In the first round of screening, 4006 irrelevant articles were excluded based on titles and abstracts, leaving 681 articles. In the second round, we excluded 558 articles after full-text review, including 278 nonmedical education articles, 195 non-GAI articles, 18 focused on other medical fields (eg, nursing), and 67 of different types (eg, commentaries). During the paper preparation, we conducted a supplementary search for 8 systematic reviews and meta-analyses. Ultimately, 131 articles were included in the final review (see <xref ref-type="fig" rid="figure3">Figure 3</xref>). Among the 131 included studies, the distribution of research designs was as follows: 83 cross-sectional studies, 5 randomized controlled trials (RCTs), 2 quasi-experimental studies, 1 cohort study, 1 quasi-randomized controlled trial, 8 systematic reviews and meta-analyses, 5 mixed-methods studies, and 1 case study. The remaining 25 studies were categorized as &#x201C;other&#x201D; with nonstandardized research designs, which were not fitting typical epidemiological or evidence-based medicine classifications. Collectively, cross-sectional studies (descriptive research designs) constituted the majority (n=83), reflecting the emerging state of GAI in medical education, where most research focuses on initial application explorations, feasibility assessments, and user experience descriptions rather than hypothesis-driven experimental designs. Other study types, including RCTs, cohort studies, and systematic reviews, provided supplementary evidence on intervention effects, longitudinal trends, and synthesized findings, respectively.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Article screening flow chart. AI: artificial intelligence.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v11i1e71125_fig03.png"/></fig></sec><sec id="s3-2"><title>Analysis of Literature Source and Human Development Levels</title><p>Based on the countries or regions of origin for the included articles and HDI classification, we analyzed the distribution of related studies. The results are illustrated in <xref ref-type="table" rid="table2">Table 2</xref> and <xref ref-type="fig" rid="figure4">Figure 4</xref>. A significant portion (74%, n=97 articles) of the research came from countries or regions with very high human development, with the United States contributing 33 studies. High human development countries or regions produced 15% (n=19 articles), with China contributing 13 studies. Medium human development countries or regions contributed 5% (n=7 articles), mainly from India, while low human development countries or regions accounted for only 2% (n=3 articles). Furthermore, 4% of the studies (n=5 articles) involved cross-level collaborations, primarily between very high and medium or low HDI countries or regions.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Distribution of countries or regions of origin for generative artificial intelligence (GAI) research in medical education (categorized by the HDI<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">HDI classification</td><td align="left" valign="bottom">Portion, n (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Very high human development</td><td align="left" valign="top">97 (74.0)</td></tr><tr><td align="left" valign="top">High human development</td><td align="left" valign="top">19 (14.5)</td></tr><tr><td align="left" valign="top">Medium human development</td><td align="left" valign="top">7 (5.3)</td></tr><tr><td align="left" valign="top">Low human development</td><td align="left" valign="top">3 (2.2)</td></tr><tr><td align="left" valign="top">Cross-level HDI collaboration</td><td align="left" valign="top">5 (3.8)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>HDI: Human Development Index.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Geographical distribution of countries or regions of origin for generative artificial intelligence (GAI) research in medical education.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v11i1e71125_fig04.png"/></fig></sec><sec id="s3-3"><title>Applications of GAI in Medical Education</title><sec id="s3-3-1"><title>Medical Educational Assessment</title><sec id="s3-3-1-1"><title>Scoring Short Answers Automatically</title><p>A recent study examined GPT-4 (OpenAI) and Gemini 1.0 Pro in automated short answer grading using 2288 student responses from 12 undergraduate medical courses across 3 languages, with instructor-provided rubrics or sample solutions as reference standards. GPT-4 showed high precision (0.91) in identifying fully correct answers, though its scores were significantly lower than human graders, while Gemini 1.0 Pro had no significant difference from human evaluations, with a mean normalized score of 0.68 (SD 0.32) and median of 0.75, similar to humans. Both models demonstrated high consistency across repeated evaluations, especially with high-quality standard responses, and these findings are specific to undergraduate medical education contexts [<xref ref-type="bibr" rid="ref26">26</xref>].</p></sec><sec id="s3-3-1-2"><title>Evaluating Articles</title><p>Liu et al [<xref ref-type="bibr" rid="ref27">27</xref>] reported that in their study of 50 rehabilitation-related original articles, 50 sections (introductions, discussions, and conclusions) were generated by ChatGPT-3.5 and 50 were corresponding AI-rephrased versions using Wordtune Originality.ai, achieved 100% accuracy in detecting both AI-generated and AI-rephrased content. ZeroGPT correctly identified 96% of AI-generated texts and 88% of rephrased ones. The study focused specifically on rehabilitation medicine with analyzed content limited to partial article sections rather than full texts. It is notable that such high detection rates have not been widely observed across other disciplines or with newer large language model versions. The specialized nature of medical writing, including technical terminology use, may also influence these outcomes in ways not seen in broader academic contexts, which should be considered when evaluating the generalizability of these findings. Another study comparing automatic scoring systems (ChatGPT-3.5 and ChatGPT-4) with manual scoring for article quality assessment found no significant difference between GPT-4-based scoring and human grading. This demonstrates the considerable potential of GAI to enhance the quality evaluation of articles [<xref ref-type="bibr" rid="ref28">28</xref>].</p></sec></sec></sec><sec id="s3-4"><title>Medical Educational Resources</title><sec id="s3-4-1"><title>Providing Standard Answers</title><p>The performance of different question types: The studies encompassed a range of question types, including multiple-choice questions (MCQs), single-choice questions, short-answer questions (SAQs), true or false questions, open-ended short-answer questions (SOAQs), long-answer questions, clinical case analysis questions (CAQs), and image-text integrated questions [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]. An exploratory study conducted by a research team from Qatar University evaluated ChatGPT&#x2019;s performance across various assessment formats relevant to undergraduate dental education. The study included 50 assessment items covering 50 different learning outcomes, with 10 items for each of the 5 formats: MCQs, SAQs, short essay questions (SEQs), single true or false questions, and fill-in-the-blank items. These items were based on core clinical topics in dental education, such as restorative dentistry, periodontics, endodontics, and oral surgery, aligned with the learning outcomes expected of undergraduate dental students. In this study, ChatGPT demonstrated 90% accuracy for SAQs, SEQs, and fill-in-the-blank items and notably achieved 100% accuracy in single true or false questions [<xref ref-type="bibr" rid="ref31">31</xref>]. However, other studies have revealed a significant decline in accuracy for CAQs, as low as 17%, which require strong logical reasoning and lack predefined options [<xref ref-type="bibr" rid="ref34">34</xref>].</p><p>Regarding MCQs, a study reported that GPT-4 and Microsoft Bing achieved top scores (76%) on the University of Antwerp medical licensing MCQ exam, outperforming medical students. However, ChatGPT&#x2019;s accuracy fell considerably when tackling Chinese-language medical MCQs with an accuracy of 37%. In addition, another study reported that in the Chinese Master&#x2019;s Degree Entrance Examination, ChatGPT&#x2019;s accuracy for single-choice questions (A1 type) was 56%, whereas for MCQs, it dropped to 33% [<xref ref-type="bibr" rid="ref15">15</xref>]. These findings suggest that GAI&#x2019;s performance is not uniformly robust across all MCQ types and is influenced by factors such as question structure, subject domain, difficulty, language, and the presence of clinical vignettes or images.</p><p>The performance of different difficulty questions: In terms of difficulty, questions were generally classified as &#x201C;easy,&#x201D; &#x201C;medium,&#x201D; or &#x201C;difficult.&#x201D; For example, the difficulty levels are defined based on the performance indicators of the historical question bank: &#x201C;Difficult&#x201D; (<italic>P</italic>&#x003C;.30; less than 30% of the students answered correctly), &#x201C;Medium&#x201D; (<italic>P</italic>=.30 to .80), and &#x201C;Easy&#x201D; (<italic>P</italic>&#x003E;.80) [<xref ref-type="bibr" rid="ref35">35</xref>]. ChatGPT-4 demonstrated strong performance on easy questions, with accuracy rates reaching 97.4%. Yet, even in this category, ChatGPT-4&#x2019;s performance lagged behind that of residents [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref38">38</xref>-<xref ref-type="bibr" rid="ref42">42</xref>]. In contrast, ChatGPT-4 excelled on medium and difficult questions, outperforming residents by 25.4 and 24.4 percentage points, respectively [<xref ref-type="bibr" rid="ref38">38</xref>]. Across all models, performance tended to decline with increased difficulty, especially for higher-level questions that required multistep reasoning, where accuracy dropped markedly [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref45">45</xref>].</p><p>The performance of questions at different cognitive levels: 2 studies investigated the performance of ChatGPT-4 on questions categorized by Bloom&#x2019;s taxonomy, which includes 6 cognitive levels: remembering, understanding, applying, analyzing, evaluating, and creating [<xref ref-type="bibr" rid="ref46">46</xref>]. These studies found that ChatGPT-4 consistently performed well across all cognitive levels, with an average correct answer rate of 71.96% for each cognitive level [<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref48">48</xref>].</p></sec><sec id="s3-4-2"><title>Generating Diverse Clinical Cases</title><p>By collaborating with instructors, GAI can quickly generate comprehensive clinical cases, including patient history, physical examination results, lab data, and differential diagnoses tailored to predefined learning objectives (eg, chest pain and joint pain). This reduces the time instructors spend developing such cases [<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]. Furthermore, GAI-generated cases can integrate various contextual factors such as race, occupation, and lifestyle, significantly enriching the diversity of teaching materials [<xref ref-type="bibr" rid="ref51">51</xref>]. For example, when creating a case based on a disease profile specific to a region, the ethnicity of the generated patient can be adjusted accordingly. In the context of type 2 diabetes, modifications can be made to the age range and weight distribution. In addition, randomized prompts for urine analysis may be included in urinary tract infection cases. Both patient presentations and examination findings can be randomized, and symptom expression can be customized to meet specific learning needs [<xref ref-type="bibr" rid="ref51">51</xref>].</p><p>In Smith and colleagues&#x2019; [<xref ref-type="bibr" rid="ref52">52</xref>] study, GAI was assigned the task of creating a case of an immigrant with mental health concerns, as this group may require specialized social psychiatry interventions. The results indicated that GAI was able to produce a case that met fundamental educational objectives. However, it included several signs of emotional disorders, highlighting a need for further refinement.</p></sec><sec id="s3-4-3"><title>Digital Interaction and Communication Training</title><p>Studies have shown that GAI is effective in promoting interactive learning and providing practice in communication skills. GAI-powered simulation tools simulate changes in clinical conditions in scenarios such as advanced cardiac life support (ACLS) and intensive care unit (ICU) sepsis, prompting students to critically analyze whether their decisions are correct [<xref ref-type="bibr" rid="ref53">53</xref>]. In addition, conversational GAI-created digital patients provide anesthetists with valuable training for patient interactions, reducing reliance on human actors while enhancing the flexibility and consistency of the training process [<xref ref-type="bibr" rid="ref54">54</xref>]. These digital interactions create a safe space for repeated practice, providing dynamic learning experiences that traditional textbooks cannot match [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. Furthermore, conversational GAI models, such as chatbots, can simulate the role of a professor, offering critical evaluations of literature and distilling complex research into easily understandable key findings, thus fostering simulated discussions between students and experts in the field [<xref ref-type="bibr" rid="ref56">56</xref>]. However, besides experiences and qualitative observations, formal evaluations of the reliability and validity of such GAI-generated information in a professor-like capacity are still needed.</p></sec><sec id="s3-4-4"><title>Sharing Educational Resources</title><p>By generating accessible public health information, GAI enhances the public&#x2019;s understanding of essential health issues, such as infectious disease prevention and vaccination, ultimately leading to improved health literacy [<xref ref-type="bibr" rid="ref30">30</xref>]. Furthermore, GAI-generated clinical cases can be disseminated as Open Educational Resources (OERs), providing medical educators with globally adaptable teaching materials that are customized to local contexts [<xref ref-type="bibr" rid="ref51">51</xref>].</p></sec><sec id="s3-4-5"><title>Generating Clinical Images</title><p>GAI tools such as Adobe Firefly, DALL&#x00B7;E 2 (OpenAI), Bing Image Creator, and generative adversarial networks (GANs) can create clinical images displaying various pathological features based on textual descriptions, potentially addressing the shortage of authentic pathological images in traditional medical education due to medical confidentiality and patient privacy restrictions [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref57">57</xref>-<xref ref-type="bibr" rid="ref59">59</xref>]. For instance, images of retinal disease generated by the stable diffusion model enhance students&#x2019; learning opportunities in ophthalmic pathology, greatly enhancing the availability of visual teaching resources [<xref ref-type="bibr" rid="ref57">57</xref>]. However, their reliability and accuracy vary significantly across models and tasks. For example, DALL&#x00B7;E 2 demonstrated an overall clinical accuracy rate of 22.2% in aligning generated images with textual prompts across 15 semantic relations (eg, spatial and action-based relationships), with only 3 relationships (touching, helping, and kicking) achieving moderate consistency above 25%. In a medical education context, DALL&#x00B7;E 2 achieved 78% accuracy for soft-tissue tumor images but produced inconsistent results for wound images, with 65% of generated wound images containing anatomical inaccuracies or irrelevant elements [<xref ref-type="bibr" rid="ref58">58</xref>]. A comparative study of DALL&#x00B7;E 2, Midjourney, and Blue Willow for generating skin ulcer images showed DALL&#x00B7;E 2 performed best with an average score of 3.2/5 (scale 1&#x2010;5) but still produced irrelevant content (eg, X-rays instead of pressure ulcers) in 20% of cases. Midjourney generated stylized, exaggerated features in 40% of images, while Blue Willow produced images with little relevance to prompts in 70% of attempts [<xref ref-type="bibr" rid="ref59">59</xref>].</p></sec></sec><sec id="s3-5"><title>Medical Educational Methods</title><sec id="s3-5-1"><title>Curriculum Design</title><p>GAI shows potential in the early stages of curriculum development, aiding in quickly creating course objectives, learning strategies, and frameworks. For instance, in a study on integrated pharmacotherapy of infectious disease education modules, ChatGPT helped design curriculum goals (eg, &#x201C;describe mechanisms of antibiotic resistance&#x201D;) with an average expert rating of 92% for appropriateness and accuracy, supporting educators&#x2014;especially in designing foundational courses [<xref ref-type="bibr" rid="ref60">60</xref>].</p></sec><sec id="s3-5-2"><title>Generating Customized Teaching Aids</title><p>Researchers have developed derivative applications based on classical models, such as Glass AI (a powerful AI-driven knowledge management system developed by Glass Health, focusing on organizing and retrieving health-related information efficiently). It integrates GPT-4 with evidence-based, peer-reviewed clinical guidelines to generate differential diagnoses and clinical plans based on textual input of clinical cases, enabling students to interact with it and experience the GAI-driven diagnostic process for cases [<xref ref-type="bibr" rid="ref61">61</xref>]. Similarly, an MCQ generator based on ChatGPT-generated cases offers a dynamic platform for personalized learning assessments [<xref ref-type="bibr" rid="ref62">62</xref>].</p></sec><sec id="s3-5-3"><title>Generating Explanations for Multiple-Choice Questions</title><p>Research shows that when GAI is used to answer MCQs, the explanations generated by GAI can better convey key knowledge points and achieve good accuracy and degree of matching with teachers&#x2019; explanations. Of the 81 questions explained by the teacher and correctly answered by ChatGPT, 92.6% of the explanations were accurate and included at least part of the teacher&#x2019;s explanation. However, the research also highlights that if an initial response is incorrect, the likelihood of subsequent errors increases significantly (<italic>P</italic>&#x003C;.001), indicating that an early mistake may lead to systematic inaccuracies in later explanations [<xref ref-type="bibr" rid="ref63">63</xref>]. Complementing this, in a systematic review, the broader literature reviewed showed that the majority of studies (5/8, 62.5%) indicate the effectiveness of AI in generating valid MCQs, with a preference for the latest GPT-4 models (6/8, 75%) [<xref ref-type="bibr" rid="ref64">64</xref>].</p></sec><sec id="s3-5-4"><title>Personalized Learning Support</title><p>Studies demonstrate that GAI boosts students&#x2019; learning efficiency across multiple stages by offering personalized feedback and customized content. This includes support for exam preparation [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref65">65</xref>-<xref ref-type="bibr" rid="ref68">68</xref>], optimizing learning paths and review strategies [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref69">69</xref>-<xref ref-type="bibr" rid="ref71">71</xref>], clarifying medical concepts [<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref72">72</xref>-<xref ref-type="bibr" rid="ref76">76</xref>], and assisting in the development of tailored career plans [<xref ref-type="bibr" rid="ref77">77</xref>]. For instance, in physiological case analysis, GAI offers precise responses and contextually relevant feedback. A cross-sectional study tested 77 physiology case vignettes (covering diverse physiological and pathophysiological scenarios, designed for undergraduates) on ChatGPT 3.5, Google Bard, and Microsoft Bing. Rated by two physiologists on a 0&#x2010;4 scale, ChatGPT scored highest at 3.19 (SD 0.3), outperforming Bard (2.91, SD 0.5) and Bing (2.15, SD 0.6) with <italic>P</italic>&#x003C;.001. ChatGPT&#x2019;s precision accelerates task completion, helping students grasp medical knowledge in practical scenarios more effectively [<xref ref-type="bibr" rid="ref78">78</xref>]. Furthermore, a study found that in cases of initial incorrect responses, GPT-4 was able to self-correct and provide accurate answers after simple follow-up questions or hints, mimicking pedagogical interactions observed in residency programs. This dynamic learning approach, coupled with rapid information processing, positions GPT-4 as an important asset for personalized learning [<xref ref-type="bibr" rid="ref79">79</xref>].</p></sec><sec id="s3-5-5"><title>Medical Decision Aid</title><p>GAI uses its ability to analyze complex, domain-specific knowledge to support the diagnosis of rare and intricate diseases. In addition to diagnosis, it can generate differential diagnoses tailored to the unique characteristics of each disease, providing health care professionals with precise decision-making support [<xref ref-type="bibr" rid="ref80">80</xref>-<xref ref-type="bibr" rid="ref83">83</xref>]. For common pathological issues and basic data analysis, GAI tools are efficient and accurate, helping pathologists organize their thought processes and expedite the initial diagnostic phases [<xref ref-type="bibr" rid="ref84">84</xref>]. The impact of domain-specific training is profound. For instance, refined datasets in the surgical and anesthesiology fields enhance GAI&#x2019;s clinical decision-making capabilities. In scenarios such as a &#x201C;30-year-old pregnant woman requiring an emergency appendectomy,&#x201D; GAI suggests not only tailored surgical strategies but also factors in critical anesthesia protocols [<xref ref-type="bibr" rid="ref85">85</xref>]. Furthermore, in the field of traditional Chinese medicine, when combined with such tools, GAI can effectively create knowledge maps that organize entities, attributes, and their relationships to traditional Chinese medicine through graphical structures. GAI provides unique support for teaching traditional Chinese medicine and disease diagnosis and treatment decisions [<xref ref-type="bibr" rid="ref86">86</xref>].</p></sec><sec id="s3-5-6"><title>Multidisciplinary Knowledge Acquisition</title><p>GAI demonstrates potential in multidisciplinary knowledge acquisition within medical education by providing high-quality knowledge across various medical subfields [<xref ref-type="bibr" rid="ref87">87</xref>-<xref ref-type="bibr" rid="ref94">94</xref>]. GAI demonstrates adaptability across disciplines, including shoulder and elbow surgery, sports medicine, and oncology [<xref ref-type="bibr" rid="ref91">91</xref>]. Research further indicates that GAI models such as ChatGPT-4 excel in internal medicine, pediatrics, obstetrics and gynecology, surgery, emergency care, and public health [<xref ref-type="bibr" rid="ref88">88</xref>-<xref ref-type="bibr" rid="ref90">90</xref>,<xref ref-type="bibr" rid="ref92">92</xref>-<xref ref-type="bibr" rid="ref94">94</xref>]. Notably, a study assessing ChatGPT-4&#x2019;s performance in the American Board of Family Medicine (ABFM) certification examination demonstrated its significant proficiency, with both the custom robot version (embedded in a specialized subenvironment designed to mimic examination conditions and given extensive preparation resources) and the regular version (standard ChatGPT-4) achieving high correct response rates of 88.67% and 87.33% respectively, well above the passing threshold. This further highlights GAI&#x2019;s value in enhancing medical education within a multidisciplinary framework, making it a powerful learning support tool across a wide range of fields, including family medicine [<xref ref-type="bibr" rid="ref95">95</xref>]. A meta-analysis of ChatGPT-3.5/4 across medical, pharmacy, dentistry, and nursing licensing exams revealed an overall accuracy of 70.1% (95% CI 65%&#x2010;74.8%; <italic>P</italic>&#x003C;.001). Performance varied significantly by field (Q=15.334; <italic>P</italic>=.002), with pharmacy having the highest rate (71.5%, 95% CI 66.3%&#x2010;76.2%) and nursing having the lowest rate (61.8%, 95% CI 58.7%&#x2010;64.9%). These results demonstrate GAI&#x2019;s potential to provide multidisciplinary learning support in health professions [<xref ref-type="bibr" rid="ref96">96</xref>]. It is crucial to note that the evidence presented in this section highlights the individual learner&#x2019;s ability to access and comprehend information across disciplines. This review&#x2019;s existing evidence has not yet extensively covered GAI&#x2019;s direct support for complex interdisciplinary teamwork, closed-loop communication, or the cultivation of specific professional behaviors within collaborative learning environments.</p></sec><sec id="s3-5-7"><title>Academic Writing Optimization</title><p>A study shows that GAI excels in creating article outlines and editing formatting, which alleviates common writing challenges related to poor organization and grammatical mistakes [<xref ref-type="bibr" rid="ref28">28</xref>]. In addition, GAI can significantly improve the quality and standardization of academic writing, allowing medical educators and students to express their ideas more accurately and clearly [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref97">97</xref>]. Furthermore, GAI assists students in organizing and generating literature content while writing their thesis [<xref ref-type="bibr" rid="ref98">98</xref>]. The content produced by GAI maintains consistency in language and includes appropriate academic terminology and logical structure, helping students present themselves more professionally in their academic writing [<xref ref-type="bibr" rid="ref55">55</xref>]. Furthermore, GAI supports many non-native English speakers in overcoming language barriers during the academic writing process, which enables them to engage more confidently in academic communication [<xref ref-type="bibr" rid="ref71">71</xref>].</p></sec></sec><sec id="s3-6"><title>Statistical Analysis of the Application of GAI Models</title><p>The models discussed in 131 articles include ChatGPT, Gemini (formerly known as Bard), Copilot (formerly known as Bing), Claude, and LLaMA, as well as other types of models such as StyleGAN2-ADA, Stable Diffusion, and customized chatbots.</p><p>Among the various models studied, ChatGPT stands out due to its advanced natural language processing capabilities. Of the 131 articles, 119 (89.5%) focused on ChatGPT, which was applied in diverse educational contexts, including simulating doctor-patient conversations, generating exam questions, and providing personalized learning support. These applications highlight their flexibility and adaptability in medical education. Notably, research had shown that as versions have iterated, ChatGPT-4 has significantly improved in both performance and scope compared to ChatGPT-3.5 [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref94">94</xref>,<xref ref-type="bibr" rid="ref99">99</xref>-<xref ref-type="bibr" rid="ref101">101</xref>].</p><p>Gemini was mentioned in 22 articles, accounting for 16.5% of the total. Copilot was mentioned in 11 articles, primarily due to its integration with the Microsoft ecosystem, making it ideal for educational management and resource development. Claude was cited in 6 articles. LLaMA, referenced in 4 articles, stands out for its ability to run locally, making it suitable for environments with limited resources. In addition, StyleGAN2-ADA, Stable Diffusion, and Convai were discussed in individual studies, mainly for their use in image generation and visualizing doctor-patient interactions.</p><p>The performance assessment of two or more models was compared in 26 articles. In comparative studies within the articles, numerous models have undergone head-to-head research, including ChatGPT-4 with Gemini 1.0 Pro [<xref ref-type="bibr" rid="ref26">26</xref>], ChatGPT-4 with ChatGPT-3.5 [<xref ref-type="bibr" rid="ref96">96</xref>], ChatGPT 3.5 with Google Bard and Microsoft Bing [<xref ref-type="bibr" rid="ref78">78</xref>], DALL-E 2 with Midjourney and Blue Willow [<xref ref-type="bibr" rid="ref59">59</xref>], and Originality.ai with ZeroGPT [<xref ref-type="bibr" rid="ref27">27</xref>]. Based on these head-to-head investigations, different models demonstrate proficiency in specific tasks: ChatGPT-4 performs better in handling complex tasks, providing accurate medical knowledge, generating exam questions, and offering personalized learning support, especially in English-language medical licensing examinations; Gemini 1.0 Pro is noted for its strong contextual understanding and multimodal capabilities; ChatGPT-3.5 excels in simulating doctor-patient conversations, generating exam questions, and providing personalized learning support; Microsoft Bing achieved top scores alongside GPT-4 in medical licensing MCQ exams; DALL-E 2 shows potential in creating clinical images with specific pathological features from textual descriptions; and Originality.ai achieves high accuracy in detecting both AI-generated and AI-rephrased medical writing.</p></sec><sec id="s3-7"><title>Challenges of GAI in Medical Education</title><sec id="s3-7-1"><title>Existing Defects at This Stage</title><sec id="s3-7-1-1"><title>Insufficient Scene Adaptability</title><p>Insufficient scene adaptability is due to the following factors.</p><p>First is the poor ability to handle complex clinical scenarios. GAI faces substantial limitations when handling complex clinical scenarios, particularly in cases requiring multistep reasoning, intricate calculations, and recognition of atypical clinical symptoms [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref87">87</xref>,<xref ref-type="bibr" rid="ref102">102</xref>,<xref ref-type="bibr" rid="ref103">103</xref>]. For instance, studies have shown that GAI struggles with MCQs, X-type problems, and tasks demanding deep reasoning. This underscores its limited ability to perform the nuanced decision-making required in medical judgments [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref84">84</xref>,<xref ref-type="bibr" rid="ref89">89</xref>-<xref ref-type="bibr" rid="ref92">92</xref>,<xref ref-type="bibr" rid="ref104">104</xref>-<xref ref-type="bibr" rid="ref107">107</xref>]. Furthermore, GAI-generated clinical scenarios often lack flexibility and fail to replicate the diversity and complexity of real-life clinical environments, thereby limiting learners&#x2019; exposure to the spectrum of challenging cases [<xref ref-type="bibr" rid="ref108">108</xref>,<xref ref-type="bibr" rid="ref109">109</xref>]. GAI also faces technical limitations in generating simulated images for complex diseases, resulting in images that fail to depict atypical manifestations accurately [<xref ref-type="bibr" rid="ref57">57</xref>]. Furthermore, GAI models demonstrate uneven knowledge depth, exemplified by an ophthalmology meta-analysis: accuracy was 78% in &#x201C;Pathology&#x201D; but significantly lower in foundational or clinical areas, such as &#x201C;Ophthalmology fundamentals&#x201D; (52%), &#x201C;Clinical ophthalmology&#x201D; (57%), and &#x201C;Refractive surgery&#x201D; (59%) [<xref ref-type="bibr" rid="ref110">110</xref>].</p><p>Second is the lack of local background in specific regions. Numerous studies have shown that GAI often struggles to adapt effectively to a specific region&#x2019;s unique background and needs when dealing with medical content related to that region, thereby undermining its universal applicability in multicultural settings [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref102">102</xref>,<xref ref-type="bibr" rid="ref111">111</xref>]. For example, ChatGPT often responds to public health issues in India with a Western-centric perspective, overlooking local situations and cultural differences [<xref ref-type="bibr" rid="ref33">33</xref>]. Similarly, ChatGPT struggles to accurately comprehend and adapt to the local regulatory environment when addressing medical policies specific to China, largely due to the limited representation of Chinese data in its training set [<xref ref-type="bibr" rid="ref102">102</xref>,<xref ref-type="bibr" rid="ref112">112</xref>].</p><p>Third is language adaptability issues. Currently, GAI exhibits significant limitations in processing languages, particularly in non-English medical education environments. The accuracy of GAI models like ChatGPT often varies greatly when handling languages such as Chinese, Korean, and Polish, resulting in incorrect outcomes in these contexts [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref106">106</xref>,<xref ref-type="bibr" rid="ref113">113</xref>-<xref ref-type="bibr" rid="ref115">115</xref>]. A meta-analysis quantified disparity: GPT-3.5 achieved 57% accuracy (95% CI 52%&#x2010;62%; <italic>P</italic>&#x003C;.01) in English-speaking countries and 58% (95% CI 52%&#x2010;64%; <italic>P</italic>&#x003C;.01) in non-English-speaking countries (<italic>P</italic>=.72). GPT-4 scored 86% (95% CI 82%&#x2010;89%; <italic>P</italic>&#x003C;0.01) in English-speaking countries versus 80% (95% CI 76%&#x2010;83%; <italic>P</italic>&#x003C;.01) in non-English-speaking countries (<italic>P</italic>=.02), demonstrating the adaptability issues of GAI models across different linguistic and regional contexts [<xref ref-type="bibr" rid="ref116">116</xref>].</p><p>Fourth is a lack of nontextual information analysis skills. Current GAI tools like ChatGPT and Bard struggle to handle image-based queries, limiting their application in fields such as dentistry, neurosurgery, and nuclear medicine, where visual analysis of images and tissue samples is crucial for clinical decision-making [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref73">73</xref>-<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref117">117</xref>].</p></sec><sec id="s3-7-1-2"><title>Data Quality and Information Bias</title><p>Data quality issues and information bias occur due to the following factors.</p><p>First is the hallucination phenomenon. In GAI applications, hallucinations occur when the content generated by GAI diverges from factual accuracy or contradicts itself, remaining a prevalent issue. In total, 3 primary types of hallucinations have been identified: input-conflicting hallucination, context-conflicting hallucination, and fact-conflicting hallucination. Input-conflicting hallucination occurs when the GAI-generated content contradicts the initial information provided by the user. This can mislead learners and hinder their understanding of specific concepts [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref118">118</xref>]. Context-conflicting hallucination arises when the GAI offers contradictory responses to the same or similar questions. This inconsistency is particularly evident in complex case analyses [<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref90">90</xref>,<xref ref-type="bibr" rid="ref119">119</xref>,<xref ref-type="bibr" rid="ref120">120</xref>]. Fact-conflicting hallucination occurs when the GAI reports facts that contradict established information, often with a high confidence level, which can easily mislead learners [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref121">121</xref>-<xref ref-type="bibr" rid="ref137">137</xref>].</p><p>Second is the lack of details on output content. Numerous studies have highlighted that GAI often generates overly simplified or vague responses, lacking essential details and knowledge necessary for a comprehensive understanding [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref114">114</xref>,<xref ref-type="bibr" rid="ref118">118</xref>,<xref ref-type="bibr" rid="ref120">120</xref>,<xref ref-type="bibr" rid="ref135">135</xref>,<xref ref-type="bibr" rid="ref136">136</xref>,<xref ref-type="bibr" rid="ref138">138</xref>,<xref ref-type="bibr" rid="ref139">139</xref>]. For instance, evaluations of GAI in cardiology have revealed that it fails to specify the types of heart murmurs associated with valve diseases. In addition, GAI-generated descriptions of pathophysiology and epidemiology tend to be overly general, often including vague statements such as &#x201C;certain age groups are at higher risk&#x201D; without specifying the specific conditions. Furthermore, GAI often produces incomplete or inaccurate information when generating case study materials, which can lead to misleading students. For example, GAI-generated learning materials on melanoma have been known to omit crucial tumor markers like S-100 or the latest treatment for BRAF (B-Raf proto-oncogene, serine, or threonine kinase) mutations [<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref138">138</xref>]. The same problems are evident in academic writing assistance, where GAI may create basic article structures but often lacks the depth, detail, and critical citations found in human-generated content [<xref ref-type="bibr" rid="ref120">120</xref>].</p><p>Third is the lack of personalization. The content generated by GAI lacks personalization tailored to individual needs. This limitation mainly manifests in the generated text, which often adopts similar writing patterns and standardized language, struggling to incorporate personalized perspectives or creative expressions [<xref ref-type="bibr" rid="ref28">28</xref>]. In a medical environment, GAI-generated treatment plans, although generally reasonable, often fail to consider individual patient characteristics, such as the severity of the disease, lifestyle, and personal preferences [<xref ref-type="bibr" rid="ref105">105</xref>].</p><p>Fourth is dataset dependency. The performance of GAI is significantly influenced by the quality and diversity of its training data. If the data is insufficient or skewed, it may lead to potential biases and limitations in practical applications, causing underperformance in less-represented areas [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref82">82</xref>,<xref ref-type="bibr" rid="ref85">85</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref111">111</xref>,<xref ref-type="bibr" rid="ref117">117</xref>,<xref ref-type="bibr" rid="ref122">122</xref>,<xref ref-type="bibr" rid="ref126">126</xref>,<xref ref-type="bibr" rid="ref140">140</xref>-<xref ref-type="bibr" rid="ref143">143</xref>]. In addition, the cutoff date for the training data means that GAI may lack knowledge of the latest research, leading to outdated or inaccurate recommendations [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref89">89</xref>,<xref ref-type="bibr" rid="ref92">92</xref>,<xref ref-type="bibr" rid="ref94">94</xref>,<xref ref-type="bibr" rid="ref109">109</xref>,<xref ref-type="bibr" rid="ref129">129</xref>,<xref ref-type="bibr" rid="ref136">136</xref>,<xref ref-type="bibr" rid="ref141">141</xref>,<xref ref-type="bibr" rid="ref144">144</xref>]. For example, when advising on treatment for bipolar disorder in pregnant women, ChatGPT-4 failed to incorporate the latest studies and instead suggested outdated methods [<xref ref-type="bibr" rid="ref89">89</xref>]. Furthermore, the data bias present in GAI during the training process cannot be overlooked [<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref107">107</xref>,<xref ref-type="bibr" rid="ref108">108</xref>,<xref ref-type="bibr" rid="ref132">132</xref>,<xref ref-type="bibr" rid="ref139">139</xref>,<xref ref-type="bibr" rid="ref145">145</xref>]. Such biases often arise from the intrinsic imbalances within the dataset, which subsequently permeate the generated content. These biases manifest as stereotypes, mainly depicting certain professions or physical attributes. For instance, some occupations may be associated with higher BMIs, while the French ethnicity is stereotypically linked to the profession of &#x201C;wine connoisseur&#x201D; [<xref ref-type="bibr" rid="ref51">51</xref>].</p></sec></sec></sec><sec id="s3-8"><title>Potential Issues in the Future</title><sec id="s3-8-1"><title>Overreliance</title><p>Overreliance can be caused due to the following factors.</p><p>First is impaired critical thinking. The rapid feedback provided by GAI may reduce students&#x2019; time for deep thinking, weakening their ability to analyze problems and independently engage in critical learning. This phenomenon is particularly evident in medical education, where students often rely on the answers provided by GAI when solving complex problems rather than relying on their logical reasoning and knowledge accumulation for analysis and resolution [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref98">98</xref>,<xref ref-type="bibr" rid="ref99">99</xref>,<xref ref-type="bibr" rid="ref124">124</xref>,<xref ref-type="bibr" rid="ref136">136</xref>,<xref ref-type="bibr" rid="ref146">146</xref>-<xref ref-type="bibr" rid="ref152">152</xref>].</p><p>Second is decreased creativity. When students use GAI tools like ChatGPT, they often receive writing suggestions that lack the creativity and depth of human-generated content. Thus, prolonged reliance on such tools may weaken their independent writing skills and hinder their ability to engage with complex topics that require critical thinking and practical expertise [<xref ref-type="bibr" rid="ref28">28</xref>]. Similarly, educators who overly depend on GAI for content creation may stifle their curricular innovation, limit diversity and depth in teaching materials, and ultimately diminish the overall quality of education [<xref ref-type="bibr" rid="ref60">60</xref>].</p><p>Third is decreased teamwork ability. Overreliance on GAI tools such as ChatGPT can weaken students&#x2019; communication skills and ability to engage actively in collaborative teamwork [<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref152">152</xref>]. Furthermore, the frequent use of these tools limits opportunities for meaningful interpersonal interaction with peers and mentors, hindering the development of essential teamwork and communication skills [<xref ref-type="bibr" rid="ref152">152</xref>].</p><p>Fourth is decreased practical problem-solving ability. Practical problem-solving is essential for clinical decision-making and patient management. However, the convenience of GAI tools may lead students to rely on preexisting solutions, neglecting the deeper analysis and logical reasoning necessary to develop personalized answers [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref87">87</xref>,<xref ref-type="bibr" rid="ref151">151</xref>-<xref ref-type="bibr" rid="ref153">153</xref>]. Furthermore, using these tools may reduce interaction with mentors and peers, limiting students&#x2019; opportunities to gain diverse perspectives through collaborative discussions and approach problems from multiple angles [<xref ref-type="bibr" rid="ref147">147</xref>].</p></sec><sec id="s3-8-2"><title>Ethical Controversy</title><p>Ethical controversies can occur due to the following factors.</p><p>First is the authenticity of the test results, as the integration of GAI in testing and assessment may compromise the accuracy and effectiveness of traditional methods used to evaluate students&#x2019; actual capabilities. GAI-generated responses or GAI-assisted evaluations risk reflecting the performance of GAI itself rather than students&#x2019; authentic abilities. This issue is evident in various exams, such as medical licensing and specialty exams, presenting new ethical challenges in medical education [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref99">99</xref>,<xref ref-type="bibr" rid="ref144">144</xref>,<xref ref-type="bibr" rid="ref146">146</xref>,<xref ref-type="bibr" rid="ref154">154</xref>].</p><p>Second is academic misconduct, since GAI-generated content often evades traditional plagiarism detection tools, making it easier for students to exploit GAI tools to complete assignments or write papers without being detected, thus jeopardizing academic integrity [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref154">154</xref>]. In addition, the ease of using GAI to generate answers cultivates students&#x2019; mindset of overreliance on such tools for academic tasks, which may increase their future likelihood of academic misconduct [<xref ref-type="bibr" rid="ref70">70</xref>-<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref124">124</xref>,<xref ref-type="bibr" rid="ref155">155</xref>]. This issue extends beyond individual students and poses a broader threat to academic ethics, as GAI-generated content can be misinterpreted as original work, distorting academic evaluations [<xref ref-type="bibr" rid="ref125">125</xref>,<xref ref-type="bibr" rid="ref150">150</xref>].</p><p>Third is a lack of clinical interaction and emotional resonance. When addressing complex ethical or emotional medical issues, GAI lacks the empathy and emotional responsiveness inherent in human physicians, potentially undermining trust in the doctor-patient relationship [<xref ref-type="bibr" rid="ref98">98</xref>,<xref ref-type="bibr" rid="ref131">131</xref>]. This limitation is supported by a General Medicine In-Training Examination (GM-ITE) study comparing GPT-4 and Japanese residents. In the GM-ITE, &#x201C;medical interview and professionalism&#x201D; category assesses patient communication, ethics, and professionalism. It uses scenario-based questions (eg, addressing a terminally ill patient&#x2019;s anxiety or resolving treatment ethics). Responses are scored 0&#x2010;10 based on communication appropriateness, empathy depth, and ethical application, with top marks for nuanced, human-centric judgment. Notably, GPT-4 scored 8.6 points lower here than residents [<xref ref-type="bibr" rid="ref38">38</xref>]. Furthermore, because GAI tools do not provide an authentic, interactive experience or situational awareness, they may struggle to simulate the behavior and reactions of real patients accurately. This limitation makes it challenging for students to fully appreciate the importance of empathy and its application in doctor-patient interactions, which affects their development of communication and empathy skills development [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref76">76</xref>,<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref101">101</xref>,<xref ref-type="bibr" rid="ref107">107</xref>,<xref ref-type="bibr" rid="ref147">147</xref>,<xref ref-type="bibr" rid="ref152">152</xref>].</p><p>Fourth is resource inequality, which is most evident in the unequal access to technology and data. Datasets used for training GAI often exhibit biases, particularly involving data from different racial or socioeconomic backgrounds. This can worsen existing health care disparities. Furthermore, developing high-quality LLMs requires substantial computational resources, creating significant access barriers, especially for educational institutions or students with limited financial means. Hence, subscription fees and hardware limitations restrict their access to these GAI tools [<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref85">85</xref>,<xref ref-type="bibr" rid="ref134">134</xref>].</p><p>Fifth is the ownership of intellectual property rights. The widespread use of GAI in medical education raises numerous intellectual property concerns, particularly regarding copyright disputes related to the medical data used during AI training [<xref ref-type="bibr" rid="ref113">113</xref>]. In addition, the legal status of GAI-generated content remains unclear, as current copyright laws do not adequately address the ownership of GAI-generated images and texts. This leaves the ownership of such content unclear, complicating the determination of whether the rights belong to the user, the developer, or other stakeholders [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref124">124</xref>].</p><p>Sixth is the &#x201C;black box&#x201D; problem and the attribution of responsibility. The application of GAI in medical education faces a significant challenge known as the &#x201C;black box&#x201D; problem. This issue arises from the lack of transparency and interpretability of GAI models, which directly affects the safety and reliability of these applications in medical settings. This lack of transparency makes it hard to understand how GAI reaches specific conclusions, especially when results are erroneous or biased, complicating efforts to trace and correct mistakes [<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref148">148</xref>]. Furthermore, when GAI is used for diagnostic or clinical decision support, any errors or biases in its generated results can make it difficult to establish accountability. Trust in the doctor-patient relationship is built on clear responsibility. However, the lack of transparency in GAI models undermines this trust, leaving patients and physicians uncertain about the safety and reliability of GAI-driven decisions [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref114">114</xref>].</p></sec></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This scoping review systematically identifies 3 core characteristics of GAI in medical education through an analysis of 131 included studies: pronounced regional disparities, empowerment potential via RMA synergy, and unresolved technical and ethical challenges. These findings must be contextualized within the field&#x2019;s evolving landscape: Our initial screening retrieved 5991 articles, a striking number reflecting both the opportunities and challenges of this emerging domain. This vast volume can be attributed to GAI&#x2019;s rapid evolution as a nascent technology, where relevant concepts remain loosely defined and inconsistent. Consequently, keyword usage lacks standardization, often resulting in the inclusion of tangentially related cross-disciplinary studies. Furthermore, GAI&#x2019;s inherently interdisciplinary nature broadens the scope of relevant literature. While this abundance highlights widespread interest and diverse applications, it also emphasizes the lack of conceptual clarity and consistency in frameworks. Therefore, although research is progressing, the field remains in a transitional stage, moving from &#x201C;conceptual standardization&#x201D; to &#x201C;unified frameworks.&#x201D; To propel the field forward, the academic community needs to reach a consensus on GAI-related definitions and application structures. Achieving this standardization will enable better tracking of emerging trends and facilitate the effective use of new insights.</p><p>Against this backdrop, regional distribution analysis reveals marked concentration of GAI research in very high HDI regions (74%), with minimal contributions from low-HDI regions (2%) and scarce cross-regional collaborations (4%), highlighting structural inequities in global technology diffusion. Model use patterns further demonstrate ChatGPT&#x2019;s dominant adoption (89.5%), driven by its superior performance in multifaceted educational tasks: (1) iterative version advancements (eg, GPT-4&#x2019;s significant improvements in reasoning accuracy and error reduction over GPT-3.5); (2) proven efficacy across diverse applications including clinical simulation, exam question generation, and personalized tutoring; and (3) robust multilingual support despite variability in non-English contexts. This technical versatility explains its preferential adoption by researchers. The disproportionately high usage rate of general LLMs over specialized models, coupled with a predominant focus on cross-model comparisons rather than synergistic integration, reflects insufficient exploration of technical adaptability and system interoperability within current research.</p><p>Within the RMA tripartite framework established in this study, GAI reshapes medical education through coordinated optimization across 3 dimensions. In resource provisioning, it effectively mitigates traditional constraints of specimen scarcity and privacy limitations through the efficient generation of diverse clinical cases and pathological images. Methodologically, it facilitates the transition from standardized instruction to personalized education through interdisciplinary knowledge integration and targeted learning support. For assessment, high concordance in automated scoring and academic integrity monitoring provides scalable solutions for educational quality assurance. This closed-loop optimization mechanism, which encompasses resource allocation, pedagogical implementation, and evaluative feedback, validates the framework&#x2019;s explanatory power for technology-enabled educational transformation.</p><p>Nevertheless, profound barriers impede deeper GAI integration. Current technical deficiencies manifest as: inadequate contextual adaptation (eg, limitations in complex clinical reasoning and MCQ processing), data quality flaws (including hallucinatory outputs and deficient nontextual information analysis), and linguistic or regional biases (particularly performance degradation in non-English contexts). Long-term risks include erosion of critical thinking and creativity due to overreliance, alongside ethical governance dilemmas that encompass ambiguous accountability, inequitable resource distribution, and deficient clinician-patient emotional engagement. These dual challenges constitute fundamental barriers to implementing human-AI collaboration paradigms.</p></sec><sec id="s4-2"><title>Comparison With Existing Literature</title><p>This scoping review specifically focuses on the period between January 2023 and October 2024, a critical transitional phase where GAI in medical education shifted from theoretical exploration to practical implementation. By capturing this transformative era, it addresses the gap in previous reviews [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref9">9</xref>] that lacked coverage of the latest advancements. While building on the foundational insights of earlier studies, this review extends their scope by identifying emerging trends and practical applications that have emerged with GAI&#x2019;s maturation in educational contexts.</p><p>Our observation of pronounced regional disparities starkly aligns with and quantifies the well-documented &#x201C;digital divide&#x201D; prevalent in global health technology diffusion [<xref ref-type="bibr" rid="ref156">156</xref>]. However, this study provides concrete, GAI-specific evidence within medical education, highlighting the extreme concentration and the critical scarcity of cross-tier collaboration, thereby reinforcing concerns about equity in accessing transformative educational technologies and potentially exacerbating global health workforce inequities.</p><p>Regarding model use, the overwhelming dominance of ChatGPT mirrors its widespread popularity in GAI application studies [<xref ref-type="bibr" rid="ref157">157</xref>]. Yet, our analysis delves deeper than mere prevalence reports or bibliometric study [<xref ref-type="bibr" rid="ref158">158</xref>-<xref ref-type="bibr" rid="ref160">160</xref>], specifically attributing this dominance to its rapid iteration (eg, GPT-4&#x2019;s improvements), proven versatility across key educational tasks (clinical sim, QG, and tutoring), and relatively robust (though imperfect) multilingual support, which are crucial for adoption in the diverse contexts of medical education research.</p><p>Our development of the RMA tripartite framework represents a key theoretical departure. While existing research acknowledges GAI&#x2019;s impact on discrete educational facets (resource provision, teaching methodologies, and evaluative processes), a unifying framework that binds these elements into a synergistic, closed-loop optimization mechanism is conspicuously absent from the current discourse [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Such a framework uniquely conceptualizes these three dimensions as an interdependent, dynamic closed-loop system essential for understanding GAI&#x2019;s holistic transformative potential. Crucially, the empirical identification of significant RMA imbalance (robust exploration of educational methods and resources vs sparse focus on learner assessment) does not imply that assessment is under-prioritized in education broadly, but rather reflects a current skew in GAI-medical education integration&#x2014;with research disproportionately focusing on resource enrichment and methodological optimization, while lagging in the development of learner assessment applications [<xref ref-type="bibr" rid="ref161">161</xref>]. This imbalance, viewed through our novel integrative lens, offers a structured diagnostic for the systemic gap in aligning GAI capabilities with the specific needs of learner assessment within medical education.</p><p>The unresolved technical-ethical challenges documented (eg, contextual limitations, hallucinations, biases, erosion of critical thinking, and concerns about empathy) resonate strongly with growing critiques of LLMs in healthcare [<xref ref-type="bibr" rid="ref162">162</xref>,<xref ref-type="bibr" rid="ref163">163</xref>]. Our review explicitly maps these well-recognized limitations onto the sensitive context of medical education, highlighting their manifestation and potential impact in shaping future clinicians. This reinforces concerns raised elsewhere but grounds them firmly in the educational domain.</p><p>Another distinctive contribution of this review lies in revealing a critical technological imbalance: the overwhelming focus on general-purpose LLMs like ChatGPT contrasts sharply with the lack of systematic development of specialized medical models and the near absence of research on multimodel collaborative mechanisms within medical education [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref164">164</xref>]. This finding highlights a gap in the current technological approach, which hinders depth and clinical authenticity. While previous studies used available tools, our synthesis highlights this specific limitation as a barrier to deeper integration.</p></sec><sec id="s4-3"><title>Implications of the Findings</title><sec id="s4-3-1"><title>Implications for Educational Practice</title><p>This study makes a key contribution to pedagogical practice by establishing the RMA tripartite framework and revealing its developmental imbalances, thereby providing a practical paradigm for the integration of GAI into medical education. The core value of this framework lies in elucidating the dynamic closed-loop nature of technology-enhanced education, wherein resource provision establishes the pedagogical foundation, methodological innovation activates knowledge transformation, and assessment feedback drives systemic evolution; these 3 components constitute an interlocking educational mechanism [<xref ref-type="bibr" rid="ref165">165</xref>].</p><p>As evidenced in the results section, the current imbalance, characterized by rich exploration in GAI-supported educational resources and teaching methods yet relatively limited progress in GAI-driven automated evaluation of learner performance, stems from an overemphasis on short-term efficiency in early technology adoption. This has led to systemic neglect of assessment&#x2019;s role as an optimization tool. For example, GAI is widely used to generate diverse clinical cases and pathological images to enrich educational resources and design adaptive learning pathways to innovate teaching methods. However, in learner assessment, most GAI tools still rely on simple automated scoring of knowledge-based quizzes, with few leveraging GAI to evaluate higher-order competencies such as clinical reasoning or diagnostic accuracy [<xref ref-type="bibr" rid="ref26">26</xref>]. Another instance is that many researchers use GAI to create interactive simulation scenarios as a methodological advancement but fail to integrate automated assessment features that track learners&#x2019; decision-making processes in these scenarios [<xref ref-type="bibr" rid="ref53">53</xref>]. This misses opportunities to use assessment data to refine the scenarios themselves. Overreliance on GAI for resource and method innovation without matching progress in automated learner assessment risks disconnecting what is taught or provided from what learners need to master, ultimately limiting GAI&#x2019;s ability to drive meaningful change in medical education.</p><p>Achieving optimal integration requires establishing a bidirectional enhancement cycle centered on assessment. Automated assessment data capturing learning bottlenecks should guide the real-time expansion of clinical case libraries&#x2019; pathological spectra and difficulty calibration [<xref ref-type="bibr" rid="ref166">166</xref>], shifting resource provision from one-size-fits-all to demand responsiveness. Simultaneously, the focus on core competencies (such as clinical reasoning and problem-solving) emphasized in teaching methods must be integrated into new assessment dimensions [<xref ref-type="bibr" rid="ref167">167</xref>], driving teaching methods to evolve from mere knowledge transmission to competency development. Within this cycle, assessment functions not merely as a quality monitoring tool, but as the central nexus for the co-evolution of resources and methods.</p><p>Realizing this vision necessitates educators reconceptualizing operational logic [<xref ref-type="bibr" rid="ref165">165</xref>]. This involves using assessment data to inform the development of educational resources, specifically leveraging insights into learners&#x2019; knowledge gaps and skill deficiencies to dynamically adjust the complexity of clinical cases [<xref ref-type="bibr" rid="ref168">168</xref>], embedding real-time, practical, and contextual feedback mechanisms within high-order teaching activities like simulated diagnostics to optimize pedagogical strategies [<xref ref-type="bibr" rid="ref169">169</xref>], and establishing adaptive rules enabling cross-dimensional interaction to facilitate systemic iteration [<xref ref-type="bibr" rid="ref170">170</xref>,<xref ref-type="bibr" rid="ref171">171</xref>]. Collectively, this structural transformation elevates the tripartite framework into an organic educational operating system.</p><p>However, technological integration inherently presents dual challenges, highlighting the importance of upholding core principles of human-AI collaboration. Generating educational resources without clinical context review risks reinforcing data biases [<xref ref-type="bibr" rid="ref172">172</xref>]; methodological innovation overly reliant on algorithmic decisions may erode critical thinking [<xref ref-type="bibr" rid="ref9">9</xref>]; and automated assessment replacing human judgment may overlook students&#x2019; psychological needs, reducing course engagement and well-being scores [<xref ref-type="bibr" rid="ref173">173</xref>]. These manifestations of technological alienation arise from the partial ceding of human agency. Resolution lies in upholding a human-AI symbiotic vision: recognizing GAI as a collaborator, not a replacement, in educational evolution. Specifically at the resource layer, clinicians and educators must oversee the development of educational resources (eg, clinical cases) to balance efficiency, ethics, and clinical authenticity [<xref ref-type="bibr" rid="ref174">174</xref>,<xref ref-type="bibr" rid="ref175">175</xref>]. At the method layer, educators should direct learning path design to integrate technological augmentation with pedagogical wisdom [<xref ref-type="bibr" rid="ref176">176</xref>]. At the assessment layer, institutions should implement verification systems that combine human evaluation with machine automation, ensuring assessments balance efficiency with humanistic dimensions [<xref ref-type="bibr" rid="ref173">173</xref>,<xref ref-type="bibr" rid="ref177">177</xref>]. This reconfiguration of responsibilities positions technology as a tool and reaffirms human stewardship of education.</p></sec><sec id="s4-3-2"><title>Implications for Technological Development</title><p>This study identifies a technological imbalance in the application of GAI within medical education. This imbalance is characterized by the dominance of large general language models, while the development of specialized models for specific medical disciplines has lacked systematic progress. This limitation restricts the depth of technology-enabled education and indicates a neglect of multimodel collaborative mechanisms within current research paradigms.</p><p>The study proposes an integrated system using general LLMs alongside specialized medical models, employing a hierarchical collaborative architecture to reshape the technological ecosystem of medical education. The core operational logic establishes a 3-tiered functional division: general models act as the central hub for teaching interactions, handling basic task parsing and process orchestration; medical specialized models, drawing on vertical domain knowledge bases, execute high-complexity core teaching tasks such as clinical reasoning and medical image generation; and a cross-model validation mechanism forms a closed-loop quality control system. This architecture adapts the hospital&#x2019;s multidisciplinary team approach to AI in education, aligning technological capabilities with the requirements of medical education for expertise, reliability, and contextual authenticity.</p><p>Within medical education, this integrated system can facilitate 3 key changes. First, it addresses limitations in specialized knowledge depth inherent in traditional general models, improving training efficacy for advanced clinical reasoning. Second, it leverages GAI&#x2019;s multimodal capabilities, which integrate text and image data, to address key issues in medical imaging education including shortages of teaching resources like rare pathological images and the limits of static materials in showing dynamic anatomical relationships. This support helps evolve pathology visualization from static atlases to interactive 3D simulations, letting students explore spatial structures and pathological changes more intuitively [<xref ref-type="bibr" rid="ref178">178</xref>]. Third, it establishes a cross-model knowledge validation chain to automatically identify and correct typical logical inconsistencies and factual errors in general models, ensuring the academic rigor of teaching content. These changes collectively represent a paradigm shift from tool-assisted learning to intelligent teaching partnership systems [<xref ref-type="bibr" rid="ref179">179</xref>].</p><p>Supporting the effective operation of this system requires targeted solutions to key technical challenges. The primary task involves developing specialized models with medical context adaptive capabilities, specifically enhancing their semantic parsing of unstructured clinical texts to address performance variability in complex case analysis [<xref ref-type="bibr" rid="ref180">180</xref>,<xref ref-type="bibr" rid="ref181">181</xref>]. Concurrently, it is necessary to construct dynamically evolving medical education datasets that incorporate cross-regional case spectra and multilingual clinical literature to systematically mitigate cultural biases and time-lag effects in training data [<xref ref-type="bibr" rid="ref182">182</xref>]. Integrating privacy-preserving computation techniques like federated learning can enable secure data collaboration among institutions, continuously optimizing model localization and adaptation while safeguarding patient information security [<xref ref-type="bibr" rid="ref183">183</xref>,<xref ref-type="bibr" rid="ref184">184</xref>].</p></sec><sec id="s4-3-3"><title>Implications for Policies and Governance</title><p>This study reveals a pronounced regional disparity in the application of GAI within the field of medical education. Specifically, regions with a very high HDI dominate research output in this domain, while contributions from the low-HDI areas account for only 2%. The scarcity of cross-tier collaboration between very high- and low-HDI areas further exacerbates this structural inequity in resource distribution. This imbalance epitomizes systemic inequalities within global knowledge production systems, rooted in 3 compounding barriers: inadequate computational infrastructure in resource-constrained settings impedes technological localization, proprietary restrictions on core models under patent regimes limit feasible technology transfer, and excessive reliance on clinical data from high-income countries compromises model adaptability to regional health care priorities. Without deliberate intervention, this self-reinforcing Matthew Effect cycle risks intensifying the global fragmentation of medical educational resources [<xref ref-type="bibr" rid="ref185">185</xref>].</p><p>Addressing this complex challenge necessitates a multitiered governance framework. At the international level, binding technology-sharing agreements should request that holders of advanced models provide architectural access under fair-use principles, emphasizing the need to balance innovation with equitable access, while emulating open-source paradigms as a reference model [<xref ref-type="bibr" rid="ref186">186</xref>]. Concurrently, the World Health Organization could coordinate multinational efforts to develop nonprofit medical corpora incorporating disease spectra prevalent in low-HDI regions, such as tropical and endemic diseases [<xref ref-type="bibr" rid="ref187">187</xref>]. Nationally, ministries of education should integrate computational infrastructure into public medical education budgets [<xref ref-type="bibr" rid="ref188">188</xref>] and similar to the Medical Education Partnership Initiative (MEPI) [<xref ref-type="bibr" rid="ref189">189</xref>], establish dedicated funds for cross-border institutional partnerships to co-develop localized pedagogical tools that address specific regional educational needs. Institutionally, medical schools should adopt algorithmic transparency protocols, requiring deployed GAI tools to provide auditable model documentation that details the demographics and geographical coverage of training data. Fairness assessments of these tools should be carried out by multidisciplinary committees, which include clinicians, ethicists, and community representatives [<xref ref-type="bibr" rid="ref190">190</xref>].</p><p>Simultaneously, institutional responses must address secondary risks through integrated technical, educational, and regulatory safeguards. To counter academic misconduct, educational institutions should implement dual-track verification systems that require GAI-assisted submissions to be accompanied by generation logs and validated through detection tools [<xref ref-type="bibr" rid="ref191">191</xref>]. Academic journals must establish clear authorship standards declaring proportional human-GAI contributions [<xref ref-type="bibr" rid="ref192">192</xref>]. Mitigating critical thinking erosion requires curriculum committees to incorporate GAI-free clinical reasoning assessments, such as on-site case analyses evaluating independent diagnostic and management planning capabilities as prerequisites for professional certification [<xref ref-type="bibr" rid="ref193">193</xref>].</p><p>Technical deficiencies demand targeted interventions. Reducing model hallucinations requires dynamic fact-checking systems linking GAI outputs to authoritative medical knowledge bases, with confidence levels displayed during teaching platform usage [<xref ref-type="bibr" rid="ref194">194</xref>]. To address the opacity of algorithms, where the process by which GAI models derive conclusions remains unclear, it is necessary to document the diagnostic reasoning processes of these models. Such documentation allows instructors to review the reasoning, helps determine accountability when inconsistencies occur, and can be integrated into resident training evaluations to strengthen oversight of GAI-assisted decision-making [<xref ref-type="bibr" rid="ref195">195</xref>].</p><p>Fundamentally, governance paradigms must transition from a technocentric approach to symbiotic development. Compared to the commonly used &#x201C;human in the loop&#x201D; [<xref ref-type="bibr" rid="ref196">196</xref>], which mainly emphasizes humans overseeing or making final decisions in AI systems, symbiotic agency theory goes further: it highlights mutual shaping between humans and AI. Humans guide AI development through ethical norms and clinical experience, while AI enhances human capabilities by expanding cognitive boundaries, forming a dynamic, mutually reinforcing relationship [<xref ref-type="bibr" rid="ref11">11</xref>]. Policies should affirm human primacy in medical education, exemplified by reserving clinical empathy training exclusively for human instructors while limiting GAI to standardized case supplementation. An effective return to the essence of symbiotic agency means building collaborative mechanisms as shown in <xref ref-type="fig" rid="figure5">Figure 5</xref>: educators lead in setting teaching goals and ensuring ethical alignment (eg, reviewing GAI-generated cases to match real clinical logic); GAI supports personalized learning; students provide feedback to refine GAI tools; and policies clarify rights and responsibilities in this interaction. This human-centered approach ensures technological advancement aligns with pedagogical integrity and global equity imperatives.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Vision of human-machine symbiosis: a schematic diagram. GAI: generative artificial intelligence.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v11i1e71125_fig05.png"/></fig></sec></sec><sec id="s4-4"><title>Limitations and Future Direction</title><p>This scoping review has several limitations that should be acknowledged. First, the rapidly evolving nature of GAI means our findings primarily reflect the landscape captured up to the search date; newer models and applications emerging subsequently may shift current patterns. Second, the inherent conceptual breadth and interdisciplinary nature of GAI pose challenges for exhaustive literature capture, potentially leading to omissions despite broad search parameters. Third, and most critically, while this study proposes 3 key conceptual frameworks (the RMA tripartite model, the hierarchical collaborative architecture, and the symbiotic agency principle) and argues for their feasibility based on synthesized evidence, it has not empirically tested their implementation or efficacy in authentic educational settings. Finally, reliance on published literature may underrepresent real-world implementation challenges and grassroots innovations.</p><p>Future research must bridge this critical gap by translating these frameworks into practice. Priority should be given to: (1) implementing and evaluating the RMA balancing strategies and the integrated system combining general and specialized medical GAI models in specific medical education contexts to assess their impact on learning outcomes and operational feasibility; (2) conducting longitudinal studies to track the dynamic evolution of GAI integration over time, observing its long-term empowerment effects on educational processes and outcomes; and (3) operationalizing the symbiotic agency framework to guide the design, deployment, and assessment of these interventions. This framework is essential for ensuring that human-AI collaboration in practice genuinely augments educator and learner agency, fosters critical competencies, and upholds pedagogical integrity, thereby realizing the envisioned synergistic educational ecosystem.</p></sec><sec id="s4-5"><title>Conclusion</title><p>The application of GAI in medical education exhibits significant regional inequities, reflecting structural disparities in technological diffusion. Statistical findings from the model research reflect that researchers have certain preferences in its usage. The emergence of GAI has revitalized medical education, which is manifested in its promotion of the diversification of educational methods, the scientific evaluation of education assessment, and the dynamic optimization of education resources. However, these innovations are accompanied by current limitations and potential future challenges. By establishing the RMA tripartite model as a dynamic closed-loop system for educational optimization, proposing an integrated multimodel architecture to reconcile general and specialized GAI capabilities, and advancing the symbiotic agency principle to safeguard human primacy, this study provides foundational frameworks for navigating GAI integration. These contributions collectively address critical gaps in conceptual standardization and collaborative design, while delineating actionable pathways for pedagogical innovation, equitable technology development, and governance reform, which ultimately steer the field toward responsible human-AI collaboration that enhances clinical education without compromising pedagogical integrity or global equity.</p></sec></sec></body><back><ack><p>This study was financially supported by the Funding of Medical Science and Technology Research in Guangdong Province, China (A2023363), the Industry-University-Research Collaborative Education Program of Ministry of Education, China (230905518284433), and the Teaching Reform Research Project of Clinical Teaching Base in Guangdong Province, China (2023-30).</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated during and analyzed during this study are available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: YL, ZL</p><p/><p>Methodology: YL, ZL</p><p/><p>Formal analysis: YL, ZL, ZY, NZ</p><p/><p>Investigation: YL, ZL, ZY, NZ</p><p/><p>Data curation: ZY, NZ</p><p/><p>Writing &#x2013; original draft: YL, ZL</p><p/><p>Writing &#x2013; review &#x0026; editing: YC, ZC, XL</p><p/><p>Visualization: ZY, NZ</p><p/><p>Supervision: L Zhao, L Zhang</p><p/><p>Project administration: L Zhao, L Zhang</p><p>Resources: YC, ZC, XL</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">GAI</term><def><p>generative artificial intelligence</p></def></def-item><def-item><term id="abb3">HDI</term><def><p>Human Development Index</p></def></def-item><def-item><term id="abb4">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb5">MCQ</term><def><p>multiple-choice question</p></def></def-item><def-item><term id="abb6">RMA</term><def><p>resource-method-assessment</p></def></def-item><def-item><term id="abb7">SAQ</term><def><p>short-answer question</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Preiksaitis</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rose</surname><given-names>C</given-names> </name></person-group><article-title>Opportunities, challenges, and future directions of generative artificial intelligence in medical education: scoping review</article-title><source>JMIR Med Educ</source><year>2023</year><month>10</month><day>20</day><volume>9</volume><fpage>e48785</fpage><pub-id pub-id-type="doi">10.2196/48785</pub-id><pub-id pub-id-type="medline">37862079</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="web"><article-title>Generative AI market (2025 - 2030)</article-title><source>Grand View Research</source><access-date>2025-03-03</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.grandviewresearch.com/industry-analysis/generative-ai-market-report">https://www.grandviewresearch.com/industry-analysis/generative-ai-market-report</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stretton</surname><given-names>B</given-names> </name><name name-style="western"><surname>Kovoor</surname><given-names>J</given-names> </name><name name-style="western"><surname>Arnold</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bacchi</surname><given-names>S</given-names> </name></person-group><article-title>ChatGPT-based learning: generative artificial intelligence in medical education</article-title><source>Med Sci Educ</source><year>2024</year><month>02</month><volume>34</volume><issue>1</issue><fpage>215</fpage><lpage>217</lpage><pub-id pub-id-type="doi">10.1007/s40670-023-01934-5</pub-id><pub-id pub-id-type="medline">38510403</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dave</surname><given-names>T</given-names> </name><name name-style="western"><surname>Athaluri</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Singh</surname><given-names>S</given-names> </name></person-group><article-title>ChatGPT in medicine: an overview of its applications, advantages, limitations, future prospects, and ethical considerations</article-title><source>Front Artif Intell</source><year>2023</year><volume>6</volume><fpage>1169595</fpage><pub-id pub-id-type="doi">10.3389/frai.2023.1169595</pub-id><pub-id pub-id-type="medline">37215063</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Karabacak</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ozkara</surname><given-names>BB</given-names> </name><name name-style="western"><surname>Margetis</surname><given-names>K</given-names> </name><name name-style="western"><surname>Wintermark</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bisdas</surname><given-names>S</given-names> </name></person-group><article-title>The advent of generative language models in medical education</article-title><source>JMIR Med Educ</source><year>2023</year><month>06</month><day>6</day><volume>9</volume><fpage>e48163</fpage><pub-id pub-id-type="doi">10.2196/48163</pub-id><pub-id pub-id-type="medline">37279048</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Totlis</surname><given-names>T</given-names> </name><name name-style="western"><surname>Natsis</surname><given-names>K</given-names> </name><name name-style="western"><surname>Filos</surname><given-names>D</given-names> </name><etal/></person-group><article-title>The potential role of ChatGPT and artificial intelligence in anatomy education: a conversation with ChatGPT</article-title><source>Surg Radiol Anat</source><year>2023</year><month>08</month><day>16</day><volume>45</volume><issue>10</issue><fpage>1321</fpage><lpage>1329</lpage><pub-id pub-id-type="doi">10.1007/s00276-023-03229-1</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Hanna</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Wakene</surname><given-names>AD</given-names> </name><name name-style="western"><surname>Lehmann</surname><given-names>CU</given-names> </name><name name-style="western"><surname>Medford</surname><given-names>RJ</given-names> </name></person-group><article-title>Assessing racial and ethnic bias in text generation for healthcare-related tasks by ChatGPT1</article-title><source>medRxiv</source><year>2023</year><month>08</month><day>28</day><fpage>2023.08.28.23294730</fpage><pub-id pub-id-type="doi">10.1101/2023.08.28.23294730</pub-id><pub-id pub-id-type="medline">37693388</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Densen</surname><given-names>P</given-names> </name></person-group><article-title>Challenges and opportunities facing medical education</article-title><source>Trans Am Clin Climatol Assoc</source><year>2011</year><volume>122</volume><fpage>48</fpage><lpage>58</lpage><pub-id pub-id-type="medline">21686208</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Weng</surname><given-names>H</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Current status of ChatGPT use in medical education: potentials, challenges, and strategies</article-title><source>J Med Internet Res</source><year>2024</year><month>08</month><day>28</day><volume>26</volume><fpage>e57896</fpage><pub-id pub-id-type="doi">10.2196/57896</pub-id><pub-id pub-id-type="medline">39196640</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Temsah</surname><given-names>O</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Chaiah</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Overview of early ChatGPT&#x2019;s presence in medical literature: insights from a hybrid literature review by ChatGPT and human experts</article-title><source>Cureus</source><year>2023</year><month>04</month><volume>15</volume><issue>4</issue><fpage>e37281</fpage><pub-id pub-id-type="doi">10.7759/cureus.37281</pub-id><pub-id pub-id-type="medline">37038381</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Neff</surname><given-names>G</given-names> </name><name name-style="western"><surname>Nagy</surname><given-names>P</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Papacharissi</surname><given-names>Z</given-names> </name></person-group><article-title>Agency in the digital age: using symbiotic agency to explain human&#x2013;technology interaction</article-title><source>A Networked Self and Human Augmentics, Artificial Intelligence, Sentience</source><year>2018</year><edition>1</edition><publisher-name>Routledge</publisher-name><fpage>97</fpage><lpage>107</lpage><pub-id pub-id-type="doi">10.4324/9781315202082-8</pub-id><pub-id pub-id-type="other">978-1-315-20208-2</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="web"><article-title>The 22 best generative AI tools for SMBs to stay competitive in 2025</article-title><source>WebFX</source><access-date>2025-07-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.webfx.com/blog/marketing/best-generative-ai-tools/">https://www.webfx.com/blog/marketing/best-generative-ai-tools/</ext-link></comment></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Temsah</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Alhuzaimi</surname><given-names>AN</given-names> </name><name name-style="western"><surname>Almansour</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Art or artifact: evaluating the accuracy, appeal, and educational value of AI-generated imagery in DALL&#x00B7;E 3 for illustrating congenital heart diseases</article-title><source>J Med Syst</source><year>2024</year><month>05</month><day>23</day><access-date>2025-07-19</access-date><volume>48</volume><issue>1</issue><fpage>54</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://sciety.org/articles/activity/10.21203/rs.3.rs-3895175/v1">https://sciety.org/articles/activity/10.21203/rs.3.rs-3895175/v1</ext-link></comment><pub-id pub-id-type="doi">10.1007/s10916-024-02072-0</pub-id><pub-id pub-id-type="medline">38780839</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="web"><article-title>Claude 2: reviews, prices &#x0026; features</article-title><source>Appvizer</source><access-date>2025-07-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.appvizer.com/artificial-intelligence/llm/claude-2">https://www.appvizer.com/artificial-intelligence/llm/claude-2</ext-link></comment></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="report"><article-title>Global large language model (LLM) market research report 2024</article-title><year>2024</year><access-date>2025-10-09</access-date><publisher-name>QYResearch</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.qyresearch.com/reports/2212992/large-language-model--llm">https://www.qyresearch.com/reports/2212992/large-language-model--llm</ext-link></comment></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="web"><article-title>OpenAI&#x2019;s o3 - AI model details</article-title><source>DocsBot AI</source><access-date>2025-07-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://docsbot.ai/models/o3">https://docsbot.ai/models/o3</ext-link></comment></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="web"><article-title>OpeneVidence</article-title><source>AITop10</source><access-date>2025-07-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://aitop10.tools/zh/detail/openevidence">https://aitop10.tools/zh/detail/openevidence</ext-link></comment></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="web"><article-title>Sora Turbo: OpenAI&#x2019;s enhanced video generation model goes public</article-title><source>Neurohive</source><access-date>2025-07-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://neurohive.io/en/ai-apps/sora-turbo-openai-s-enhanced-video-generation-model-goes-public/">https://neurohive.io/en/ai-apps/sora-turbo-openai-s-enhanced-video-generation-model-goes-public/</ext-link></comment></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="web"><article-title>AI tools for medical education and research</article-title><source>Macon &#x0026; Joan Brock Virginia Health Sciences at Old Dominion University</source><access-date>2025-07-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.evms.edu/about_us/ai_resources/resources_and_ai_tools/ai_tools_for_medical_education_and_research/">https://www.evms.edu/about_us/ai_resources/resources_and_ai_tools/ai_tools_for_medical_education_and_research/</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Cho</surname><given-names>J</given-names> </name><name name-style="western"><surname>Puspitasari</surname><given-names>FD</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Sora as an AGI world model? A complete survey on text-to-video generation</article-title><source>arXiv</source><comment>Preprint posted online on  Mar 8, 2024</comment><pub-id pub-id-type="doi">10.48550/ARXIV.2403.05131</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>H</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>H</given-names> </name></person-group><article-title>Longitudinal study of the earliest pilot of tiered healthcare system reforms in China: will the new type of chronic disease management be effective?</article-title><source>Soc Sci Med</source><year>2021</year><month>09</month><volume>285</volume><fpage>114284</fpage><pub-id pub-id-type="doi">10.1016/j.socscimed.2021.114284</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Peek</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Allen</surname><given-names>M</given-names> </name><name name-style="western"><surname>Loth</surname><given-names>KA</given-names> </name><etal/></person-group><article-title>Harmonizing the tripartite mission in academic family medicine: a longitudinal case example</article-title><source>Ann Fam Med</source><year>2024</year><volume>22</volume><issue>3</issue><fpage>237</fpage><lpage>243</lpage><pub-id pub-id-type="doi">10.1370/afm.3108</pub-id><pub-id pub-id-type="medline">38806264</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Geenens</surname><given-names>R</given-names> </name><name name-style="western"><surname>De Schutter</surname><given-names>H</given-names> </name></person-group><article-title>A tripartite model of federalism</article-title><source>Philos Soc Crit</source><year>2023</year><month>09</month><volume>49</volume><issue>7</issue><fpage>753</fpage><lpage>785</lpage><pub-id pub-id-type="doi">10.1177/01914537211066850</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Windak</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rochfort</surname><given-names>A</given-names> </name><name name-style="western"><surname>Jacquet</surname><given-names>J</given-names> </name></person-group><article-title>The revised European definition of general practice/family medicine. a pivotal role of one health, planetary health and sustainable development goals</article-title><source>Eur J Gen Pract</source><year>2024</year><month>12</month><volume>30</volume><issue>1</issue><fpage>2306936</fpage><pub-id pub-id-type="doi">10.1080/13814788.2024.2306936</pub-id><pub-id pub-id-type="medline">38334099</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="report"><article-title>Human development report 2023-24</article-title><year>2024</year><month>03</month><access-date>2024-12-05</access-date><publisher-name>United Nations Development Programme</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://hdr.undp.org/content/human-development-report-2023-24">https://hdr.undp.org/content/human-development-report-2023-24</ext-link></comment></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gr&#x00E9;visse</surname><given-names>C</given-names> </name></person-group><article-title>LLM-based automatic short answer grading in undergraduate medical education</article-title><source>BMC Med Educ</source><year>2024</year><month>09</month><day>27</day><volume>24</volume><issue>1</issue><fpage>1060</fpage><pub-id pub-id-type="doi">10.1186/s12909-024-06026-5</pub-id><pub-id pub-id-type="medline">39334087</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>JQJ</given-names> </name><name name-style="western"><surname>Hui</surname><given-names>KTK</given-names> </name><name name-style="western"><surname>Al Zoubi</surname><given-names>F</given-names> </name><etal/></person-group><article-title>The great detectives: humans versus AI detectors in catching large language model-generated medical writing</article-title><source>Int J Educ Integr</source><year>2024</year><month>05</month><day>20</day><volume>20</volume><issue>1</issue><fpage>8</fpage><pub-id pub-id-type="doi">10.1007/s40979-024-00155-6</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zong</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Exploring the potential of artificial intelligence to enhance the writing of english academic papers by non-native english-speaking medical students - the educational application of ChatGPT</article-title><source>BMC Med Educ</source><year>2024</year><month>07</month><day>9</day><volume>24</volume><issue>1</issue><pub-id pub-id-type="doi">10.1186/s12909-024-05738-y</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>KC</given-names> </name><name name-style="western"><surname>Bu</surname><given-names>ZJ</given-names> </name><name name-style="western"><surname>Shahjalal</surname><given-names>M</given-names> </name><etal/></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Grewal</surname><given-names>HS</given-names> </name></person-group><article-title>Performance of ChatGPT on Chinese master&#x2019;s degree entrance examination in clinical medicine</article-title><source>PLoS ONE</source><year>2024</year><volume>19</volume><issue>4</issue><fpage>e0301702</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0301702</pub-id><pub-id pub-id-type="medline">38573944</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cherif</surname><given-names>H</given-names> </name><name name-style="western"><surname>Moussa</surname><given-names>C</given-names> </name><name name-style="western"><surname>Missaoui</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Salouage</surname><given-names>I</given-names> </name><name name-style="western"><surname>Mokaddem</surname><given-names>S</given-names> </name><name name-style="western"><surname>Dhahri</surname><given-names>B</given-names> </name></person-group><article-title>Appraisal of ChatGPT&#x2019;s aptitude for medical education: comparative analysis with third-year medical students in a pulmonology examination</article-title><source>JMIR Med Educ</source><year>2024</year><month>07</month><day>23</day><volume>10</volume><fpage>e52818</fpage><pub-id pub-id-type="doi">10.2196/52818</pub-id><pub-id pub-id-type="medline">39042876</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ali</surname><given-names>K</given-names> </name><name name-style="western"><surname>Barhom</surname><given-names>N</given-names> </name><name name-style="western"><surname>Tamimi</surname><given-names>F</given-names> </name><name name-style="western"><surname>Duggal</surname><given-names>M</given-names> </name></person-group><article-title>ChatGPT&#x2014;A double&#x2010;edged sword for healthcare education? Implications for assessments of dental students</article-title><source>Eur J Dental Education</source><year>2024</year><month>02</month><volume>28</volume><issue>1</issue><fpage>206</fpage><lpage>211</lpage><pub-id pub-id-type="doi">10.1111/eje.12937</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Panthier</surname><given-names>C</given-names> </name><name name-style="western"><surname>Gatinel</surname><given-names>D</given-names> </name></person-group><article-title>Success of ChatGPT, an AI language model, in taking the French language version of the European Board of Ophthalmology examination: A novel approach to medical knowledge assessment</article-title><source>J Fr Ophtalmol</source><year>2023</year><month>09</month><volume>46</volume><issue>7</issue><fpage>706</fpage><lpage>711</lpage><pub-id pub-id-type="doi">10.1016/j.jfo.2023.05.006</pub-id><pub-id pub-id-type="medline">37537126</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gandhi</surname><given-names>AP</given-names> </name><name name-style="western"><surname>Joesph</surname><given-names>FK</given-names> </name><name name-style="western"><surname>Rajagopal</surname><given-names>V</given-names> </name><etal/></person-group><article-title>Performance of ChatGPT on the India undergraduate community medicine examination: cross-sectional study</article-title><source>JMIR Form Res</source><year>2024</year><month>03</month><day>25</day><volume>8</volume><fpage>e49964</fpage><pub-id pub-id-type="doi">10.2196/49964</pub-id><pub-id pub-id-type="medline">38526538</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yu</surname><given-names>P</given-names> </name><name name-style="western"><surname>Fang</surname><given-names>C</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Performance of ChatGPT on the Chinese postgraduate examination for clinical medicine: survey study</article-title><source>JMIR Med Educ</source><year>2024</year><month>02</month><day>9</day><volume>10</volume><fpage>e48514</fpage><pub-id pub-id-type="doi">10.2196/48514</pub-id><pub-id pub-id-type="medline">38335017</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Morreel</surname><given-names>S</given-names> </name><name name-style="western"><surname>Verhoeven</surname><given-names>V</given-names> </name><name name-style="western"><surname>Mathysen</surname><given-names>D</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Banerjee</surname><given-names>I</given-names> </name></person-group><article-title>Microsoft Bing outperforms five other generative artificial intelligence chatbots in the Antwerp University multiple choice medical license exam</article-title><source>PLOS Digit Health</source><year>2024</year><month>02</month><volume>3</volume><issue>2</issue><fpage>e0000349</fpage><pub-id pub-id-type="doi">10.1371/journal.pdig.0000349</pub-id><pub-id pub-id-type="medline">38354127</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guerra</surname><given-names>GA</given-names> </name><name name-style="western"><surname>Hofmann</surname><given-names>H</given-names> </name><name name-style="western"><surname>Sobhani</surname><given-names>S</given-names> </name><etal/></person-group><article-title>GPT-4 artificial intelligence model outperforms ChatGPT, medical students, and neurosurgery residents on neurosurgery written board-like questions</article-title><source>World Neurosurg</source><year>2023</year><month>11</month><volume>179</volume><fpage>e160</fpage><lpage>e165</lpage><pub-id pub-id-type="doi">10.1016/j.wneu.2023.08.042</pub-id><pub-id pub-id-type="medline">37597659</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>RS</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>KJQ</given-names> </name><name name-style="western"><surname>Meaney</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kemppainen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Punnett</surname><given-names>A</given-names> </name><name name-style="western"><surname>Leung</surname><given-names>FH</given-names> </name></person-group><article-title>Assessment of resident and AI chatbot performance on the University of Toronto family medicine residency progress test: comparative study</article-title><source>JMIR Med Educ</source><year>2023</year><month>09</month><day>19</day><volume>9</volume><fpage>e50514</fpage><pub-id pub-id-type="doi">10.2196/50514</pub-id><pub-id pub-id-type="medline">37725411</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Watari</surname><given-names>T</given-names> </name><name name-style="western"><surname>Takagi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sakaguchi</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Performance comparison of ChatGPT-4 and Japanese medical residents in the general medicine in-training examination: comparison study</article-title><source>JMIR Med Educ</source><year>2023</year><month>12</month><day>6</day><volume>9</volume><fpage>e52202</fpage><pub-id pub-id-type="doi">10.2196/52202</pub-id><pub-id pub-id-type="medline">38055323</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Terwilliger</surname><given-names>E</given-names> </name><name name-style="western"><surname>Bcharah</surname><given-names>G</given-names> </name><name name-style="western"><surname>Bcharah</surname><given-names>H</given-names> </name><name name-style="western"><surname>Bcharah</surname><given-names>E</given-names> </name><name name-style="western"><surname>Richardson</surname><given-names>C</given-names> </name><name name-style="western"><surname>Scheffler</surname><given-names>P</given-names> </name></person-group><article-title>Advancing medical education: performance of generative artificial intelligence models on otolaryngology board preparation questions with image analysis insights</article-title><source>Cureus</source><year>2024</year><month>07</month><volume>16</volume><issue>7</issue><fpage>e64204</fpage><pub-id pub-id-type="doi">10.7759/cureus.64204</pub-id><pub-id pub-id-type="medline">39130878</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Revercomb</surname><given-names>L</given-names> </name><name name-style="western"><surname>Patel</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Fu</surname><given-names>D</given-names> </name><name name-style="western"><surname>Filimonov</surname><given-names>A</given-names> </name></person-group><article-title>Performance of novel GPT-4 in otolaryngology knowledge assessment</article-title><source>Indian J Otolaryngol Head Neck Surg</source><year>2024</year><month>12</month><volume>76</volume><issue>6</issue><fpage>6112</fpage><lpage>6114</lpage><pub-id pub-id-type="doi">10.1007/s12070-024-04935-x</pub-id><pub-id pub-id-type="medline">39559040</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Riedel</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kaefinger</surname><given-names>K</given-names> </name><name name-style="western"><surname>Stuehrenberg</surname><given-names>A</given-names> </name><etal/></person-group><article-title>ChatGPT&#x2019;s performance in German OB/GYN exams &#x2013; paving the way for AI-enhanced medical education and clinical practice</article-title><source>Front Med</source><year>2023</year><volume>10</volume><pub-id pub-id-type="doi">10.3389/fmed.2023.1296615</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Patel</surname><given-names>EA</given-names> </name><name name-style="western"><surname>Fleischer</surname><given-names>L</given-names> </name><name name-style="western"><surname>Filip</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Comparative performance of ChatGPT 3.5 and GPT4 on rhinology standardized board examination questions</article-title><source>OTO Open</source><year>2024</year><volume>8</volume><issue>2</issue><fpage>e164</fpage><pub-id pub-id-type="doi">10.1002/oto2.164</pub-id><pub-id pub-id-type="medline">38938507</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Takagi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Watari</surname><given-names>T</given-names> </name><name name-style="western"><surname>Erabi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sakaguchi</surname><given-names>K</given-names> </name></person-group><article-title>Performance of GPT-3.5 and GPT-4 on the Japanese medical licensing examination: comparison study</article-title><source>JMIR Med Educ</source><year>2023</year><month>06</month><day>29</day><volume>9</volume><fpage>e48002</fpage><pub-id pub-id-type="doi">10.2196/48002</pub-id><pub-id pub-id-type="medline">37384388</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Haddad</surname><given-names>F</given-names> </name><name name-style="western"><surname>Saade</surname><given-names>JS</given-names> </name></person-group><article-title>Performance of ChatGPT on ophthalmology-related questions across various examination levels: observational study</article-title><source>JMIR Med Educ</source><year>2024</year><month>01</month><day>18</day><volume>10</volume><fpage>e50842</fpage><pub-id pub-id-type="doi">10.2196/50842</pub-id><pub-id pub-id-type="medline">38236632</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gilson</surname><given-names>A</given-names> </name><name name-style="western"><surname>Safranek</surname><given-names>CW</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>T</given-names> </name><etal/></person-group><article-title>How does ChatGPT Perform on the United States Medical Licensing Examination (USMLE)? The implications of large language models for medical education and knowledge assessment</article-title><source>JMIR Med Educ</source><year>2023</year><month>02</month><day>8</day><volume>9</volume><fpage>e45312</fpage><pub-id pub-id-type="doi">10.2196/45312</pub-id><pub-id pub-id-type="medline">36753318</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Anderson</surname><given-names>LW</given-names> </name><name name-style="western"><surname>Krathwohl</surname><given-names>DR</given-names> </name></person-group><source>A Taxonomy For Learning, Teaching, And Assessing: A Revision Of Bloom&#x2019;s Taxonomy Of Educational Objectives</source><year>2001</year><publisher-name>Addison Wesley Longman, Inc</publisher-name><pub-id pub-id-type="other">0-321-08405-5</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yudovich</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Makarova</surname><given-names>E</given-names> </name><name name-style="western"><surname>Hague</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Raman</surname><given-names>JD</given-names> </name></person-group><article-title>Performance of GPT-3.5 and GPT-4 on standardized urology knowledge assessment items in the United States: a descriptive study</article-title><source>J Educ Eval Health Prof</source><year>2024</year><volume>21</volume><issue>17</issue><fpage>17</fpage><pub-id pub-id-type="doi">10.3352/jeehp.2024.21.17</pub-id><pub-id pub-id-type="medline">38977032</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bharatha</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ojeh</surname><given-names>N</given-names> </name><name name-style="western"><surname>Fazle Rabbi</surname><given-names>AM</given-names> </name><etal/></person-group><article-title>Comparing the performance of ChatGPT-4 and medical students on MCQs at varied levels of Bloom&#x2019;s taxonomy</article-title><source>Adv Med Educ Pract</source><year>2024</year><volume>15</volume><fpage>393</fpage><lpage>400</lpage><pub-id pub-id-type="doi">10.2147/AMEP.S457408</pub-id><pub-id pub-id-type="medline">38751805</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wong</surname><given-names>K</given-names> </name><name name-style="western"><surname>Fayngersh</surname><given-names>A</given-names> </name><name name-style="western"><surname>Traba</surname><given-names>C</given-names> </name><name name-style="western"><surname>Cennimo</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kothari</surname><given-names>N</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>S</given-names> </name></person-group><article-title>Using ChatGPT in the development of clinical reasoning cases: a qualitative study</article-title><source>Cureus</source><year>2024</year><month>05</month><volume>16</volume><issue>5</issue><fpage>e61438</fpage><pub-id pub-id-type="doi">10.7759/cureus.61438</pub-id><pub-id pub-id-type="medline">38953081</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shimizu</surname><given-names>I</given-names> </name><name name-style="western"><surname>Kasai</surname><given-names>H</given-names> </name><name name-style="western"><surname>Shikino</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Developing medical education curriculum reform strategies to address the impact of generative AI: qualitative study</article-title><source>JMIR Med Educ</source><year>2023</year><month>11</month><day>30</day><volume>9</volume><fpage>e53466</fpage><pub-id pub-id-type="doi">10.2196/53466</pub-id><pub-id pub-id-type="medline">38032695</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bakkum</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Hartjes</surname><given-names>MG</given-names> </name><name name-style="western"><surname>Pi&#x00EB;t</surname><given-names>JD</given-names> </name><etal/></person-group><article-title>Using artificial intelligence to create diverse and inclusive medical case vignettes for education</article-title><source>Brit J Clinical Pharma</source><year>2024</year><month>03</month><volume>90</volume><issue>3</issue><fpage>640</fpage><lpage>648</lpage><pub-id pub-id-type="doi">10.1111/bcp.15977</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Smith</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hachen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Schleifer</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bhugra</surname><given-names>D</given-names> </name><name name-style="western"><surname>Buadze</surname><given-names>A</given-names> </name><name name-style="western"><surname>Liebrenz</surname><given-names>M</given-names> </name></person-group><article-title>Old dog, new tricks? Exploring the potential functionalities of ChatGPT in supporting educational methods in social psychiatry</article-title><source>Int J Soc Psychiatry</source><year>2023</year><month>12</month><volume>69</volume><issue>8</issue><fpage>1882</fpage><lpage>1889</lpage><pub-id pub-id-type="doi">10.1177/00207640231178451</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Scherr</surname><given-names>R</given-names> </name><name name-style="western"><surname>Halaseh</surname><given-names>FF</given-names> </name><name name-style="western"><surname>Spina</surname><given-names>A</given-names> </name><name name-style="western"><surname>Andalib</surname><given-names>S</given-names> </name><name name-style="western"><surname>Rivera</surname><given-names>R</given-names> </name></person-group><article-title>ChatGPT interactive medical simulations for early clinical education: case study</article-title><source>JMIR Med Educ</source><year>2023</year><month>11</month><day>10</day><volume>9</volume><fpage>e49877</fpage><pub-id pub-id-type="doi">10.2196/49877</pub-id><pub-id pub-id-type="medline">37948112</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sardesai</surname><given-names>N</given-names> </name><name name-style="western"><surname>Russo</surname><given-names>P</given-names> </name><name name-style="western"><surname>Martin</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sardesai</surname><given-names>A</given-names> </name></person-group><article-title>Utilizing generative conversational artificial intelligence to create simulated patient encounters: a pilot study for anaesthesia training</article-title><source>Postgrad Med J</source><year>2024</year><month>03</month><day>18</day><volume>100</volume><issue>1182</issue><fpage>237</fpage><lpage>241</lpage><pub-id pub-id-type="doi">10.1093/postmj/qgad137</pub-id><pub-id pub-id-type="medline">38240054</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Magalh&#x00E3;es Araujo</surname><given-names>S</given-names> </name><name name-style="western"><surname>Cruz-Correia</surname><given-names>R</given-names> </name></person-group><article-title>Incorporating ChatGPT in medical informatics education: mixed methods study on student perceptions and experiential integration proposals</article-title><source>JMIR Med Educ</source><year>2024</year><month>03</month><day>20</day><volume>10</volume><fpage>e51151</fpage><pub-id pub-id-type="doi">10.2196/51151</pub-id><pub-id pub-id-type="medline">38506920</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brennan</surname><given-names>L</given-names> </name><name name-style="western"><surname>Balakumar</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bennett</surname><given-names>W</given-names> </name></person-group><article-title>The role of ChatGPT in enhancing ENT surgical training &#x2013; a trainees&#x2019; perspective</article-title><source>J Laryngol Otol</source><year>2024</year><month>05</month><volume>138</volume><issue>5</issue><fpage>480</fpage><lpage>486</lpage><pub-id pub-id-type="doi">10.1017/S0022215123001354</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tabuchi</surname><given-names>H</given-names> </name><name name-style="western"><surname>Engelmann</surname><given-names>J</given-names> </name><name name-style="western"><surname>Maeda</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Using artificial intelligence to improve human performance: efficient retinal disease detection training with synthetic images</article-title><source>Br J Ophthalmol</source><year>2024</year><month>09</month><day>20</day><volume>108</volume><issue>10</issue><fpage>1430</fpage><lpage>1435</lpage><pub-id pub-id-type="doi">10.1136/bjo-2023-324923</pub-id><pub-id pub-id-type="medline">38485215</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Seth</surname><given-names>I</given-names> </name><name name-style="western"><surname>Lim</surname><given-names>B</given-names> </name><name name-style="western"><surname>Cevik</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Utilizing GPT-4 and generative artificial intelligence platforms for surgical education: an experimental study on skin ulcers</article-title><source>Eur J Plast Surg</source><year>2024</year><month>01</month><day>29</day><volume>47</volume><issue>1</issue><fpage>19</fpage><pub-id pub-id-type="doi">10.1007/s00238-024-02162-9</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fan</surname><given-names>BE</given-names> </name><name name-style="western"><surname>Chow</surname><given-names>M</given-names> </name><name name-style="western"><surname>Winkler</surname><given-names>S</given-names> </name></person-group><article-title>Artificial intelligence-generated facial images for medical education</article-title><source>MedSciEduc</source><year>2023</year><month>11</month><day>14</day><volume>34</volume><issue>1</issue><fpage>5</fpage><lpage>7</lpage><pub-id pub-id-type="doi">10.1007/s40670-023-01942-5</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Al-Worafi</surname><given-names>YM</given-names> </name><name name-style="western"><surname>Goh</surname><given-names>KW</given-names> </name><name name-style="western"><surname>Hermansyah</surname><given-names>A</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Ming</surname><given-names>LC</given-names> </name></person-group><article-title>The use of ChatGPT for education modules on integrated pharmacotherapy of infectious disease: educators&#x2019; perspectives</article-title><source>JMIR Med Educ</source><year>2024</year><month>01</month><day>12</day><volume>10</volume><fpage>e47339</fpage><pub-id pub-id-type="doi">10.2196/47339</pub-id><pub-id pub-id-type="medline">38214967</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Robleto</surname><given-names>E</given-names> </name><name name-style="western"><surname>Habashi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kaplan</surname><given-names>MAB</given-names> </name><etal/></person-group><article-title>Medical students&#x2019; perceptions of an artificial intelligence (AI) assisted diagnosing program</article-title><source>Med Teach</source><year>2024</year><month>09</month><volume>46</volume><issue>9</issue><fpage>1180</fpage><lpage>1186</lpage><pub-id pub-id-type="doi">10.1080/0142159X.2024.2305369</pub-id><pub-id pub-id-type="medline">38306667</pub-id></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>K&#x0131;yak</surname><given-names>YS</given-names> </name><name name-style="western"><surname>Kononowicz</surname><given-names>AA</given-names> </name></person-group><article-title>Case-based MCQ generator: a custom ChatGPT based on published prompts in the literature for automatic item generation</article-title><source>Med Teach</source><year>2024</year><month>08</month><day>2</day><volume>46</volume><issue>8</issue><fpage>1018</fpage><lpage>1020</lpage><pub-id pub-id-type="doi">10.1080/0142159X.2024.2314723</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tong</surname><given-names>L</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Rapaka</surname><given-names>S</given-names> </name><name name-style="western"><surname>Garg</surname><given-names>PS</given-names> </name></person-group><article-title>Can ChatGPT generate practice question explanations for medical students, a new faculty teaching tool?</article-title><source>Med Teach</source><year>2025</year><month>03</month><day>4</day><volume>47</volume><issue>3</issue><fpage>560</fpage><lpage>564</lpage><pub-id pub-id-type="doi">10.1080/0142159X.2024.2363486</pub-id></nlm-citation></ref><ref id="ref64"><label>64</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Artsi</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Sorin</surname><given-names>V</given-names> </name><name name-style="western"><surname>Konen</surname><given-names>E</given-names> </name><name name-style="western"><surname>Glicksberg</surname><given-names>BS</given-names> </name><name name-style="western"><surname>Nadkarni</surname><given-names>G</given-names> </name><name name-style="western"><surname>Klang</surname><given-names>E</given-names> </name></person-group><article-title>Large language models for generating medical examinations: systematic review</article-title><source>BMC Med Educ</source><year>2024</year><month>03</month><day>29</day><volume>24</volume><issue>1</issue><fpage>354</fpage><pub-id pub-id-type="doi">10.1186/s12909-024-05239-y</pub-id><pub-id pub-id-type="medline">38553693</pub-id></nlm-citation></ref><ref id="ref65"><label>65</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kawahara</surname><given-names>T</given-names> </name><name name-style="western"><surname>Sumi</surname><given-names>Y</given-names> </name></person-group><article-title>GPT-4/4V&#x2019;s performance on the Japanese National Medical Licensing Examination</article-title><source>Med Teach</source><year>2025</year><month>03</month><volume>47</volume><issue>3</issue><fpage>450</fpage><lpage>457</lpage><pub-id pub-id-type="doi">10.1080/0142159X.2024.2342545</pub-id><pub-id pub-id-type="medline">38648547</pub-id></nlm-citation></ref><ref id="ref66"><label>66</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tran</surname><given-names>CG</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sherman</surname><given-names>SK</given-names> </name><name name-style="western"><surname>De Andrade</surname><given-names>JP</given-names> </name></person-group><article-title>Performance of ChatGPT on American Board of Surgery in-training examination preparation questions</article-title><source>J Surg Res</source><year>2024</year><month>07</month><volume>299</volume><fpage>329</fpage><lpage>335</lpage><pub-id pub-id-type="doi">10.1016/j.jss.2024.04.060</pub-id><pub-id pub-id-type="medline">38788470</pub-id></nlm-citation></ref><ref id="ref67"><label>67</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Botross</surname><given-names>M</given-names> </name><name name-style="western"><surname>Mohammadi</surname><given-names>SO</given-names> </name><name name-style="western"><surname>Montgomery</surname><given-names>K</given-names> </name><name name-style="western"><surname>Crawford</surname><given-names>C</given-names> </name></person-group><article-title>Performance of Google&#x2019;s artificial intelligence chatbot &#x201C;Bard&#x201D; (now &#x201C;Gemini&#x201D;) on ophthalmology board exam practice questions</article-title><source>Cureus</source><year>2024</year><month>03</month><volume>16</volume><issue>3</issue><fpage>e57348</fpage><pub-id pub-id-type="doi">10.7759/cureus.57348</pub-id><pub-id pub-id-type="medline">38690460</pub-id></nlm-citation></ref><ref id="ref68"><label>68</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gan</surname><given-names>W</given-names> </name><name name-style="western"><surname>Ouyang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Integrating ChatGPT in orthopedic education for medical undergraduates: randomized controlled trial</article-title><source>J Med Internet Res</source><year>2024</year><month>08</month><day>20</day><volume>26</volume><fpage>e57037</fpage><pub-id pub-id-type="doi">10.2196/57037</pub-id><pub-id pub-id-type="medline">39163598</pub-id></nlm-citation></ref><ref id="ref69"><label>69</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thomae</surname><given-names>AV</given-names> </name><name name-style="western"><surname>Witt</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Barth</surname><given-names>J</given-names> </name></person-group><article-title>Integration of ChatGPT into a course for medical students: explorative study on teaching scenarios, students&#x2019; perception, and applications</article-title><source>JMIR Med Educ</source><year>2024</year><month>08</month><day>22</day><volume>10</volume><fpage>e50545</fpage><pub-id pub-id-type="doi">10.2196/50545</pub-id><pub-id pub-id-type="medline">39177012</pub-id></nlm-citation></ref><ref id="ref70"><label>70</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Favero</surname><given-names>TG</given-names> </name></person-group><article-title>Using artificial intelligence platforms to support student learning in physiology</article-title><source>Adv Physiol Educ</source><year>2024</year><month>06</month><day>1</day><volume>48</volume><issue>2</issue><fpage>193</fpage><lpage>199</lpage><pub-id pub-id-type="doi">10.1152/advan.00213.2023</pub-id></nlm-citation></ref><ref id="ref71"><label>71</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ganjavi</surname><given-names>C</given-names> </name><name name-style="western"><surname>Eppler</surname><given-names>M</given-names> </name><name name-style="western"><surname>O&#x2019;Brien</surname><given-names>D</given-names> </name><etal/></person-group><article-title>ChatGPT and large language models (LLMs) awareness and use. A prospective cross-sectional survey of U.S. medical students</article-title><source>PLOS Digit Health</source><year>2024</year><month>09</month><volume>3</volume><issue>9</issue><fpage>e0000596</fpage><pub-id pub-id-type="doi">10.1371/journal.pdig.0000596</pub-id><pub-id pub-id-type="medline">39236008</pub-id></nlm-citation></ref><ref id="ref72"><label>72</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sallam</surname><given-names>M</given-names> </name><name name-style="western"><surname>Salim</surname><given-names>NA</given-names> </name><name name-style="western"><surname>Barakat</surname><given-names>M</given-names> </name><name name-style="western"><surname>Al-Tammemi</surname><given-names>AB</given-names> </name></person-group><article-title>ChatGPT applications in medical, dental, pharmacy, and public health education: A descriptive study highlighting the advantages and limitations</article-title><source>Narra J</source><year>2023</year><month>04</month><volume>3</volume><issue>1</issue><fpage>e103</fpage><pub-id pub-id-type="doi">10.52225/narra.v3i1.103</pub-id><pub-id pub-id-type="medline">38450035</pub-id></nlm-citation></ref><ref id="ref73"><label>73</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arun</surname><given-names>G</given-names> </name><name name-style="western"><surname>Perumal</surname><given-names>V</given-names> </name><name name-style="western"><surname>Urias</surname><given-names>F</given-names> </name><etal/></person-group><article-title>ChatGPT versus a customized AI chatbot (Anatbuddy) for anatomy education: a comparative pilot study</article-title><source>Anatomical Sciences Ed</source><year>2024</year><month>10</month><volume>17</volume><issue>7</issue><pub-id pub-id-type="doi">10.1002/ase.2502</pub-id><pub-id pub-id-type="medline">39169464</pub-id></nlm-citation></ref><ref id="ref74"><label>74</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Deng</surname><given-names>A</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>W</given-names> </name><name name-style="western"><surname>Dai</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Current application of ChatGPT in undergraduate nuclear medicine education: Taking Chongqing Medical University as an example</article-title><source>Med Teach</source><year>2025</year><month>06</month><day>3</day><volume>47</volume><issue>6</issue><fpage>997</fpage><lpage>1003</lpage><pub-id pub-id-type="doi">10.1080/0142159X.2024.2399673</pub-id></nlm-citation></ref><ref id="ref75"><label>75</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Garabet</surname><given-names>R</given-names> </name><name name-style="western"><surname>Mackey</surname><given-names>BP</given-names> </name><name name-style="western"><surname>Cross</surname><given-names>J</given-names> </name><name name-style="western"><surname>Weingarten</surname><given-names>M</given-names> </name></person-group><article-title>ChatGPT-4 performance on USMLE step 1 style questions and its implications for medical education: a comparative study across systems and disciplines</article-title><source>MedSciEduc</source><year>2023</year><month>12</month><day>27</day><volume>34</volume><issue>1</issue><fpage>145</fpage><lpage>152</lpage><pub-id pub-id-type="doi">10.1007/s40670-023-01956-z</pub-id></nlm-citation></ref><ref id="ref76"><label>76</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saleem</surname><given-names>N</given-names> </name><name name-style="western"><surname>Mufti</surname><given-names>T</given-names> </name><name name-style="western"><surname>Sohail</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Madsen</surname><given-names>D&#x00D8;</given-names> </name></person-group><article-title>ChatGPT as an innovative heutagogical tool in medical education</article-title><source>Cogent Education</source><year>2024</year><month>12</month><day>31</day><volume>11</volume><issue>1</issue><fpage>2332850</fpage><pub-id pub-id-type="doi">10.1080/2331186X.2024.2332850</pub-id></nlm-citation></ref><ref id="ref77"><label>77</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>HC</given-names> </name></person-group><article-title>ChatGPT as a life coach for professional identity formation in medical education</article-title><source>Educational Technology &#x0026; Society</source><year>2024</year><access-date>2025-10-09</access-date><volume>27</volume><issue>3</issue><fpage>374</fpage><lpage>389</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://eric.ed.gov/?q=AI%2C+AND+data&#x0026;ff1=souEducational+Technology+%26+Society&#x0026;id=EJ1437405">https://eric.ed.gov/?q=AI%2C+AND+data&#x0026;ff1=souEducational+Technology+%26+Society&#x0026;id=EJ1437405</ext-link></comment></nlm-citation></ref><ref id="ref78"><label>78</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dhanvijay</surname><given-names>AKD</given-names> </name><name name-style="western"><surname>Pinjar</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Dhokane</surname><given-names>N</given-names> </name><name name-style="western"><surname>Sorte</surname><given-names>SR</given-names> </name><name name-style="western"><surname>Kumari</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mondal</surname><given-names>H</given-names> </name></person-group><article-title>Performance of large language models (ChatGPT, Bing Search, and Google Bard) in solving case vignettes in physiology</article-title><source>Cureus</source><year>2023</year><month>08</month><volume>15</volume><issue>8</issue><fpage>e42972</fpage><pub-id pub-id-type="doi">10.7759/cureus.42972</pub-id><pub-id pub-id-type="medline">37671207</pub-id></nlm-citation></ref><ref id="ref79"><label>79</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>T</given-names> </name><name name-style="western"><surname>Mainous</surname><given-names>AG</given-names>  <suffix>3rd</suffix></name><name name-style="western"><surname>Stelter</surname><given-names>K</given-names> </name><name name-style="western"><surname>O&#x2019;Neill</surname><given-names>TR</given-names> </name><name name-style="western"><surname>Newton</surname><given-names>WP</given-names> </name></person-group><article-title>Performance evaluation of the generative pre-trained transformer (GPT-4) on the family medicine in-training examination</article-title><source>J Am Board Fam Med</source><year>2024</year><month>10</month><day>25</day><volume>37</volume><issue>4</issue><fpage>528</fpage><lpage>582</lpage><pub-id pub-id-type="doi">10.3122/jabfm.2023.230433R1</pub-id><pub-id pub-id-type="medline">39214695</pub-id></nlm-citation></ref><ref id="ref80"><label>80</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abdullahi</surname><given-names>T</given-names> </name><name name-style="western"><surname>Singh</surname><given-names>R</given-names> </name><name name-style="western"><surname>Eickhoff</surname><given-names>C</given-names> </name></person-group><article-title>Learning to make rare and complex diagnoses with generative AI assistance: qualitative study of popular large language models</article-title><source>JMIR Med Educ</source><year>2024</year><month>02</month><day>13</day><volume>10</volume><fpage>e51391</fpage><pub-id pub-id-type="doi">10.2196/51391</pub-id><pub-id pub-id-type="medline">38349725</pub-id></nlm-citation></ref><ref id="ref81"><label>81</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guastafierro</surname><given-names>V</given-names> </name><name name-style="western"><surname>Corbitt</surname><given-names>DN</given-names> </name><name name-style="western"><surname>Bressan</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Unveiling the risks of ChatGPT in diagnostic surgical pathology</article-title><source>Virchows Arch</source><year>2025</year><month>04</month><volume>486</volume><issue>4</issue><fpage>663</fpage><lpage>673</lpage><pub-id pub-id-type="doi">10.1007/s00428-024-03918-1</pub-id><pub-id pub-id-type="medline">39269615</pub-id></nlm-citation></ref><ref id="ref82"><label>82</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sarangi</surname><given-names>PK</given-names> </name><name name-style="western"><surname>Irodi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Panda</surname><given-names>S</given-names> </name><name name-style="western"><surname>Nayak</surname><given-names>DSK</given-names> </name><name name-style="western"><surname>Mondal</surname><given-names>H</given-names> </name></person-group><article-title>Radiological differential diagnoses based on cardiovascular and thoracic imaging patterns: perspectives of four large language models</article-title><source>Indian J Radiol Imaging</source><year>2024</year><month>04</month><volume>34</volume><issue>2</issue><fpage>269</fpage><lpage>275</lpage><pub-id pub-id-type="doi">10.1055/s-0043-1777289</pub-id><pub-id pub-id-type="medline">38549881</pub-id></nlm-citation></ref><ref id="ref83"><label>83</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shukla</surname><given-names>R</given-names> </name><name name-style="western"><surname>Mishra</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Banerjee</surname><given-names>N</given-names> </name><name name-style="western"><surname>Verma</surname><given-names>A</given-names> </name></person-group><article-title>The comparison of ChatGPT 3.5, Microsoft Bing, and Google Gemini for diagnosing cases of neuro-ophthalmology</article-title><source>Cureus</source><year>2024</year><month>04</month><volume>16</volume><issue>4</issue><fpage>e58232</fpage><pub-id pub-id-type="doi">10.7759/cureus.58232</pub-id><pub-id pub-id-type="medline">38745784</pub-id></nlm-citation></ref><ref id="ref84"><label>84</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hadi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Tran</surname><given-names>E</given-names> </name><name name-style="western"><surname>Nagarajan</surname><given-names>B</given-names> </name><name name-style="western"><surname>Kirpalani</surname><given-names>A</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Ata</surname><given-names>F</given-names> </name></person-group><article-title>Evaluation of ChatGPT as a diagnostic tool for medical learners and clinicians</article-title><source>PLoS ONE</source><year>2024</year><month>07</month><day>31</day><volume>19</volume><issue>7</issue><fpage>e0307383</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0307383</pub-id></nlm-citation></ref><ref id="ref85"><label>85</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guthrie</surname><given-names>E</given-names> </name><name name-style="western"><surname>Levy</surname><given-names>D</given-names> </name><name name-style="western"><surname>Del Carmen</surname><given-names>G</given-names> </name></person-group><article-title>The Operating and Anesthetic Reference Assistant (OARA): A fine-tuned large language model for resident teaching</article-title><source>Am J Surg</source><year>2024</year><month>08</month><volume>234</volume><fpage>28</fpage><lpage>34</lpage><pub-id pub-id-type="doi">10.1016/j.amjsurg.2024.02.016</pub-id><pub-id pub-id-type="medline">38365551</pub-id></nlm-citation></ref><ref id="ref86"><label>86</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Hao</surname><given-names>Y</given-names> </name></person-group><article-title>Traditional Chinese medicine knowledge graph construction based on large language models</article-title><source>Electronics (Basel)</source><year>2024</year><month>07</month><volume>13</volume><issue>7</issue><fpage>1395</fpage><pub-id pub-id-type="doi">10.3390/electronics13071395</pub-id></nlm-citation></ref><ref id="ref87"><label>87</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Luke</surname><given-names>W</given-names> </name><name name-style="western"><surname>Seow Chong</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ban</surname><given-names>KH</given-names> </name><etal/></person-group><article-title>Is ChatGPT &#x2018;ready&#x2019; to be a learning tool for medical undergraduates and will it perform equally in different subjects? Comparative study of ChatGPT performance in tutorial and case-based learning questions in physiology and biochemistry</article-title><source>Med Teach</source><year>2024</year><month>11</month><volume>46</volume><issue>11</issue><fpage>1441</fpage><lpage>1447</lpage><pub-id pub-id-type="doi">10.1080/0142159X.2024.2308779</pub-id></nlm-citation></ref><ref id="ref88"><label>88</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Oh</surname><given-names>N</given-names> </name><name name-style="western"><surname>Choi</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>WY</given-names> </name></person-group><article-title>ChatGPT goes to the operating room: evaluating GPT-4 performance and its potential in surgical education and training in the era of large language models</article-title><source>Ann Surg Treat Res</source><year>2023</year><month>05</month><volume>104</volume><issue>5</issue><fpage>269</fpage><lpage>273</lpage><pub-id pub-id-type="doi">10.4174/astr.2023.104.5.269</pub-id><pub-id pub-id-type="medline">37179699</pub-id></nlm-citation></ref><ref id="ref89"><label>89</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guillen-Grima</surname><given-names>F</given-names> </name><name name-style="western"><surname>Guillen-Aguinaga</surname><given-names>S</given-names> </name><name name-style="western"><surname>Guillen-Aguinaga</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Evaluating the efficacy of ChatGPT in navigating the Spanish Medical Residency entrance examination (MIR): promising horizons for AI in clinical medicine</article-title><source>Clin Pract</source><year>2023</year><month>11</month><day>20</day><volume>13</volume><issue>6</issue><fpage>1460</fpage><lpage>1487</lpage><pub-id pub-id-type="doi">10.3390/clinpract13060130</pub-id><pub-id pub-id-type="medline">37987431</pub-id></nlm-citation></ref><ref id="ref90"><label>90</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lai</surname><given-names>UH</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Hsu</surname><given-names>TY</given-names> </name><name name-style="western"><surname>Kan</surname><given-names>JKC</given-names> </name></person-group><article-title>Evaluating the performance of ChatGPT-4 on the United Kingdom Medical Licensing Assessment</article-title><source>Front Med</source><year>2023</year><month>09</month><day>19</day><volume>10</volume><fpage>1240915</fpage><pub-id pub-id-type="doi">10.3389/fmed.2023.1240915</pub-id></nlm-citation></ref><ref id="ref91"><label>91</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Isleem</surname><given-names>UN</given-names> </name><name name-style="western"><surname>Zaidat</surname><given-names>B</given-names> </name><name name-style="western"><surname>Ren</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Can generative artificial intelligence pass the orthopaedic board examination?</article-title><source>J Orthop</source><year>2024</year><month>07</month><volume>53</volume><fpage>27</fpage><lpage>33</lpage><pub-id pub-id-type="doi">10.1016/j.jor.2023.10.026</pub-id></nlm-citation></ref><ref id="ref92"><label>92</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mackey</surname><given-names>BP</given-names> </name><name name-style="western"><surname>Garabet</surname><given-names>R</given-names> </name><name name-style="western"><surname>Maule</surname><given-names>L</given-names> </name><name name-style="western"><surname>Tadesse</surname><given-names>A</given-names> </name><name name-style="western"><surname>Cross</surname><given-names>J</given-names> </name><name name-style="western"><surname>Weingarten</surname><given-names>M</given-names> </name></person-group><article-title>Evaluating ChatGPT-4 in medical education: an assessment of subject exam performance reveals limitations in clinical curriculum support for students</article-title><source>Discov Artif Intell</source><year>2024</year><month>05</month><day>16</day><volume>4</volume><issue>1</issue><fpage>38</fpage><pub-id pub-id-type="doi">10.1007/s44163-024-00135-2</pub-id></nlm-citation></ref><ref id="ref93"><label>93</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jaworski</surname><given-names>A</given-names> </name><name name-style="western"><surname>Jasi&#x0144;ski</surname><given-names>D</given-names> </name><name name-style="western"><surname>Jaworski</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Comparison of the performance of artificial intelligence versus medical professionals in the Polish Final Medical Examination</article-title><source>Cureus</source><year>2024</year><month>08</month><volume>16</volume><issue>8</issue><fpage>e66011</fpage><pub-id pub-id-type="doi">10.7759/cureus.66011</pub-id><pub-id pub-id-type="medline">39221376</pub-id></nlm-citation></ref><ref id="ref94"><label>94</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abbas</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rehman</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Rehman</surname><given-names>SS</given-names> </name></person-group><article-title>Comparing the performance of popular large language models on the National Board of Medical Examiners sample questions</article-title><source>Cureus</source><year>2024</year><month>03</month><volume>16</volume><issue>3</issue><fpage>e55991</fpage><pub-id pub-id-type="doi">10.7759/cureus.55991</pub-id><pub-id pub-id-type="medline">38606229</pub-id></nlm-citation></ref><ref id="ref95"><label>95</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goodings</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Kajitani</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chhor</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Assessment of ChatGPT-4 in family medicine board examinations using advanced AI learning and analytical methods: observational study</article-title><source>JMIR Med Educ</source><year>2024</year><month>10</month><day>8</day><volume>10</volume><fpage>e56128</fpage><pub-id pub-id-type="doi">10.2196/56128</pub-id><pub-id pub-id-type="medline">39378442</pub-id></nlm-citation></ref><ref id="ref96"><label>96</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jin</surname><given-names>HK</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>HE</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>E</given-names> </name></person-group><article-title>Performance of ChatGPT-3.5 and GPT-4 in national licensing examinations for medicine, pharmacy, dentistry, and nursing: a systematic review and meta-analysis</article-title><source>BMC Med Educ</source><year>2024</year><month>09</month><day>16</day><volume>24</volume><issue>1</issue><pub-id pub-id-type="doi">10.1186/s12909-024-05944-8</pub-id></nlm-citation></ref><ref id="ref97"><label>97</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lucas</surname><given-names>HC</given-names> </name><name name-style="western"><surname>Upperman</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Robinson</surname><given-names>JR</given-names> </name></person-group><article-title>A systematic review of large language models and their implications in medical education</article-title><source>Med Educ (Chicago Ill)</source><year>2024</year><month>11</month><volume>58</volume><issue>11</issue><fpage>1276</fpage><lpage>1285</lpage><pub-id pub-id-type="doi">10.1111/medu.15402</pub-id></nlm-citation></ref><ref id="ref98"><label>98</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alkhaaldi</surname><given-names>SMI</given-names> </name><name name-style="western"><surname>Kassab</surname><given-names>CH</given-names> </name><name name-style="western"><surname>Dimassi</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>Medical student experiences and perceptions of ChatGPT and artificial intelligence: cross-sectional study</article-title><source>JMIR Med Educ</source><year>2023</year><month>12</month><day>22</day><volume>9</volume><fpage>e51302</fpage><pub-id pub-id-type="doi">10.2196/51302</pub-id><pub-id pub-id-type="medline">38133911</pub-id></nlm-citation></ref><ref id="ref99"><label>99</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hersh</surname><given-names>W</given-names> </name><name name-style="western"><surname>Fultz Hollis</surname><given-names>K</given-names> </name></person-group><article-title>Results and implications for generative AI in a large introductory biomedical and health informatics course</article-title><source>NPJ Digit Med</source><year>2024</year><month>09</month><day>13</day><volume>7</volume><issue>1</issue><fpage>247</fpage><pub-id pub-id-type="doi">10.1038/s41746-024-01251-0</pub-id><pub-id pub-id-type="medline">39271955</pub-id></nlm-citation></ref><ref id="ref100"><label>100</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Altamimi</surname><given-names>I</given-names> </name><name name-style="western"><surname>Alhumimidi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Alshehri</surname><given-names>S</given-names> </name><etal/></person-group><article-title>The scientific knowledge of three large language models in cardiology: multiple-choice questions examination-based performance</article-title><source>Annals of Medicine &#x0026; Surgery</source><year>2024</year><month>05</month><day>3</day><volume>86</volume><issue>6</issue><fpage>3261</fpage><lpage>3266</lpage><pub-id pub-id-type="doi">10.1097/MS9.0000000000002120</pub-id></nlm-citation></ref><ref id="ref101"><label>101</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hou</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>L</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>F</given-names> </name></person-group><article-title>Conflict of interest the authors declare that they have no conflict of interest</article-title><source>SSRN Journal</source><year>2022</year><pub-id pub-id-type="doi">10.2139/ssrn.4258054</pub-id></nlm-citation></ref><ref id="ref102"><label>102</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zong</surname><given-names>H</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>E</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>R</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Shen</surname><given-names>B</given-names> </name></person-group><article-title>Performance of ChatGPT on Chinese national medical licensing examinations: a five-year examination evaluation study for physicians, pharmacists and nurses</article-title><source>BMC Med Educ</source><year>2024</year><month>02</month><day>14</day><volume>24</volume><issue>1</issue><fpage>143</fpage><pub-id pub-id-type="doi">10.1186/s12909-024-05125-7</pub-id><pub-id pub-id-type="medline">38355517</pub-id></nlm-citation></ref><ref id="ref103"><label>103</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bongco</surname><given-names>EDA</given-names> </name><name name-style="western"><surname>Cua</surname><given-names>SKN</given-names> </name><name name-style="western"><surname>Hernandez</surname><given-names>M</given-names> </name><name name-style="western"><surname>Pascual</surname><given-names>JSG</given-names> </name><name name-style="western"><surname>Khu</surname><given-names>KJO</given-names> </name></person-group><article-title>The performance of ChatGPT versus neurosurgery residents in neurosurgical board examination-like questions: a systematic review and meta-analysis</article-title><source>Neurosurg Rev</source><year>2024</year><month>12</month><day>7</day><volume>47</volume><issue>1</issue><fpage>892</fpage><pub-id pub-id-type="doi">10.1007/s10143-024-03144-y</pub-id><pub-id pub-id-type="medline">39643792</pub-id></nlm-citation></ref><ref id="ref104"><label>104</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cuthbert</surname><given-names>R</given-names> </name><name name-style="western"><surname>Simpson</surname><given-names>AI</given-names> </name></person-group><article-title>Artificial intelligence in orthopaedics: can Chat Generative Pre-trained Transformer (ChatGPT) pass Section 1 of the Fellowship of the Royal College of Surgeons (Trauma &#x0026; Orthopaedics) examination?</article-title><source>Postgrad Med J</source><year>2023</year><month>09</month><day>21</day><volume>99</volume><issue>1176</issue><fpage>1110</fpage><lpage>1114</lpage><pub-id pub-id-type="doi">10.1093/postmj/qgad053</pub-id><pub-id pub-id-type="medline">37410674</pub-id></nlm-citation></ref><ref id="ref105"><label>105</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tangadulrat</surname><given-names>P</given-names> </name><name name-style="western"><surname>Sono</surname><given-names>S</given-names> </name><name name-style="western"><surname>Tangtrakulwanich</surname><given-names>B</given-names> </name></person-group><article-title>Using ChatGPT for clinical practice and medical education: cross-sectional survey of medical students&#x2019; and physicians&#x2019; perceptions</article-title><source>JMIR Med Educ</source><year>2023</year><month>12</month><day>22</day><volume>9</volume><fpage>e50658</fpage><pub-id pub-id-type="doi">10.2196/50658</pub-id><pub-id pub-id-type="medline">38133908</pub-id></nlm-citation></ref><ref id="ref106"><label>106</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nicikowski</surname><given-names>J</given-names> </name><name name-style="western"><surname>Szczepa&#x0144;ski</surname><given-names>M</given-names> </name><name name-style="western"><surname>Miedziaszczyk</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kudli&#x0144;ski</surname><given-names>B</given-names> </name></person-group><article-title>The potential of ChatGPT in medicine: an example analysis of nephrology specialty exams in Poland</article-title><source>Clin Kidney J</source><year>2024</year><month>08</month><volume>17</volume><issue>8</issue><fpage>sfae193</fpage><pub-id pub-id-type="doi">10.1093/ckj/sfae193</pub-id><pub-id pub-id-type="medline">39099569</pub-id></nlm-citation></ref><ref id="ref107"><label>107</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Borchert</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Hickman</surname><given-names>CR</given-names> </name><name name-style="western"><surname>Pepys</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sadler</surname><given-names>TJ</given-names> </name></person-group><article-title>Performance of ChatGPT on the situational judgement test-a professional dilemmas-based examination for doctors in the United Kingdom</article-title><source>JMIR Med Educ</source><year>2023</year><month>08</month><day>7</day><volume>9</volume><fpage>e48978</fpage><pub-id pub-id-type="doi">10.2196/48978</pub-id><pub-id pub-id-type="medline">37548997</pub-id></nlm-citation></ref><ref id="ref108"><label>108</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hudon</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kiepura</surname><given-names>B</given-names> </name><name name-style="western"><surname>Pelletier</surname><given-names>M</given-names> </name><name name-style="western"><surname>Phan</surname><given-names>V</given-names> </name></person-group><article-title>Using ChatGPT in psychiatry to design script concordance tests in undergraduate medical education: mixed methods study</article-title><source>JMIR Med Educ</source><year>2024</year><month>04</month><day>4</day><volume>10</volume><fpage>e54067</fpage><pub-id pub-id-type="doi">10.2196/54067</pub-id><pub-id pub-id-type="medline">38596832</pub-id></nlm-citation></ref><ref id="ref109"><label>109</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Agarwal</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sharma</surname><given-names>P</given-names> </name><name name-style="western"><surname>Goswami</surname><given-names>A</given-names> </name></person-group><article-title>Analysing the applicability of ChatGPT, Bard, and Bing to generate reasoning-based multiple-choice questions in medical physiology</article-title><source>Cureus</source><year>2023</year><month>06</month><volume>15</volume><issue>6</issue><fpage>e40977</fpage><pub-id pub-id-type="doi">10.7759/cureus.40977</pub-id><pub-id pub-id-type="medline">37519497</pub-id></nlm-citation></ref><ref id="ref110"><label>110</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>JH</given-names> </name><name name-style="western"><surname>Nishida</surname><given-names>T</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>TYA</given-names> </name></person-group><article-title>Accuracy of large language models in answering ophthalmology board-style questions: A meta-analysis</article-title><source>Asia Pac J Ophthalmol (Phila)</source><year>2024</year><month>09</month><volume>13</volume><issue>5</issue><fpage>100106</fpage><pub-id pub-id-type="doi">10.1016/j.apjo.2024.100106</pub-id></nlm-citation></ref><ref id="ref111"><label>111</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Torres-Zegarra</surname><given-names>BC</given-names> </name><name name-style="western"><surname>Rios-Garcia</surname><given-names>W</given-names> </name><name name-style="western"><surname>&#x00D1;a&#x00F1;a-Cordova</surname><given-names>AM</given-names> </name><etal/></person-group><article-title>Performance of ChatGPT, Bard, Claude, and Bing on the Peruvian National Licensing Medical Examination: a cross-sectional study</article-title><source>J Educ Eval Health Prof</source><year>2023</year><volume>20</volume><fpage>30</fpage><pub-id pub-id-type="doi">10.3352/jeehp.2023.20.30</pub-id><pub-id pub-id-type="medline">37981579</pub-id></nlm-citation></ref><ref id="ref112"><label>112</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weng</surname><given-names>TL</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>YM</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>TJ</given-names> </name><name name-style="western"><surname>Hwang</surname><given-names>SJ</given-names> </name></person-group><article-title>ChatGPT failed Taiwan&#x2019;s Family Medicine Board Exam</article-title><source>J Chin Med Assoc</source><year>2023</year><month>08</month><day>1</day><volume>86</volume><issue>8</issue><fpage>762</fpage><lpage>766</lpage><pub-id pub-id-type="doi">10.1097/JCMA.0000000000000946</pub-id><pub-id pub-id-type="medline">37294147</pub-id></nlm-citation></ref><ref id="ref113"><label>113</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yoon</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Oh</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Lim</surname><given-names>BG</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>HJ</given-names> </name></person-group><article-title>Performance of ChatGPT in the in-training examination for anesthesiology and pain medicine residents in South Korea: observational study</article-title><source>JMIR Med Educ</source><year>2024</year><month>09</month><day>16</day><volume>10</volume><fpage>e56859</fpage><pub-id pub-id-type="doi">10.2196/56859</pub-id><pub-id pub-id-type="medline">39284182</pub-id></nlm-citation></ref><ref id="ref114"><label>114</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Dou</surname><given-names>Z</given-names> </name><name name-style="western"><surname>He</surname><given-names>L</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>L</given-names> </name></person-group><article-title>Performance and exploration of ChatGPT in medical examination, records and education in Chinese: Pave the way for medical AI</article-title><source>Int J Med Inform</source><year>2023</year><month>09</month><volume>177</volume><fpage>105173</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2023.105173</pub-id></nlm-citation></ref><ref id="ref115"><label>115</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Keshtkar</surname><given-names>A</given-names> </name><name name-style="western"><surname>Atighi</surname><given-names>F</given-names> </name><name name-style="western"><surname>Reihani</surname><given-names>H</given-names> </name></person-group><article-title>Systematic review of ChatGPT accuracy and performance in Iran&#x2019;s medical licensing exams: A brief report</article-title><source>J Educ Health Promot</source><year>2024</year><month>11</month><volume>13</volume><issue>1</issue><fpage>421</fpage><pub-id pub-id-type="doi">10.4103/jehp.jehp_1210_24</pub-id></nlm-citation></ref><ref id="ref116"><label>116</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Okuhara</surname><given-names>T</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Performance of ChatGPT across different versions in medical licensing examinations worldwide: systematic review and meta-analysis</article-title><source>J Med Internet Res</source><year>2024</year><month>07</month><day>25</day><volume>26</volume><fpage>e60807</fpage><pub-id pub-id-type="doi">10.2196/60807</pub-id><pub-id pub-id-type="medline">39052324</pub-id></nlm-citation></ref><ref id="ref117"><label>117</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ali</surname><given-names>R</given-names> </name><name name-style="western"><surname>Tang</surname><given-names>OY</given-names> </name><name name-style="western"><surname>Connolly</surname><given-names>ID</given-names> </name><etal/></person-group><article-title>Performance of ChatGPT and GPT-4 on neurosurgery written board examinations</article-title><source>Neurosurgery</source><year>2023</year><month>12</month><day>1</day><volume>93</volume><issue>6</issue><fpage>1353</fpage><lpage>1365</lpage><pub-id pub-id-type="doi">10.1227/neu.0000000000002632</pub-id><pub-id pub-id-type="medline">37581444</pub-id></nlm-citation></ref><ref id="ref118"><label>118</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Elias</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Burshtein</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sharon</surname><given-names>VR</given-names> </name></person-group><article-title>OpenAI&#x2019;s GPT&#x2010;4 performs to a high degree on board&#x2010;style dermatology questions</article-title><source>Int J Dermatology</source><year>2024</year><month>01</month><volume>63</volume><issue>1</issue><fpage>73</fpage><lpage>78</lpage><pub-id pub-id-type="doi">10.1111/ijd.16913</pub-id></nlm-citation></ref><ref id="ref119"><label>119</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sabri</surname><given-names>H</given-names> </name><name name-style="western"><surname>Saleh</surname><given-names>MHA</given-names> </name><name name-style="western"><surname>Hazrati</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Performance of three artificial intelligence (AI)&#x2010;based large language models in standardized testing; implications for AI&#x2010;assisted dental education</article-title><source>J of Periodontal Research</source><year>2025</year><month>02</month><volume>60</volume><issue>2</issue><fpage>121</fpage><lpage>133</lpage><pub-id pub-id-type="doi">10.1111/jre.13323</pub-id></nlm-citation></ref><ref id="ref120"><label>120</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ilgaz</surname><given-names>HB</given-names> </name><name name-style="western"><surname>&#x00C7;elik</surname><given-names>Z</given-names> </name></person-group><article-title>The significance of artificial intelligence platforms in anatomy education: an experience with ChatGPT and Google Bard</article-title><source>Cureus</source><year>2023</year><month>09</month><volume>15</volume><issue>9</issue><fpage>e45301</fpage><pub-id pub-id-type="doi">10.7759/cureus.45301</pub-id><pub-id pub-id-type="medline">37846274</pub-id></nlm-citation></ref><ref id="ref121"><label>121</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khorshidi</surname><given-names>H</given-names> </name><name name-style="western"><surname>Mohammadi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yousem</surname><given-names>DM</given-names> </name><etal/></person-group><article-title>Application of ChatGPT in multilingual medical education: How does ChatGPT fare in 2023&#x2019;s Iranian residency entrance examination</article-title><source>Informatics in Medicine Unlocked</source><year>2023</year><volume>41</volume><fpage>101314</fpage><pub-id pub-id-type="doi">10.1016/j.imu.2023.101314</pub-id></nlm-citation></ref><ref id="ref122"><label>122</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>CH</given-names> </name><name name-style="western"><surname>Hsiao</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Yeh</surname><given-names>PC</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>KC</given-names> </name><name name-style="western"><surname>Kao</surname><given-names>CH</given-names> </name></person-group><article-title>Performance of ChatGPT on Stage 1 of the Taiwanese medical licensing exam</article-title><source>Digit HEALTH</source><year>2024</year><volume>10</volume><fpage>20552076241233144</fpage><pub-id pub-id-type="doi">10.1177/20552076241233144</pub-id><pub-id pub-id-type="medline">38371244</pub-id></nlm-citation></ref><ref id="ref123"><label>123</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Apornvirat</surname><given-names>S</given-names> </name><name name-style="western"><surname>Namboonlue</surname><given-names>C</given-names> </name><name name-style="western"><surname>Laohawetwanit</surname><given-names>T</given-names> </name></person-group><article-title>Comparative analysis of ChatGPT and Bard in answering pathology examination questions requiring image interpretation</article-title><source>Am J Clin Pathol</source><year>2024</year><month>09</month><day>3</day><volume>162</volume><issue>3</issue><fpage>252</fpage><lpage>260</lpage><pub-id pub-id-type="doi">10.1093/ajcp/aqae036</pub-id></nlm-citation></ref><ref id="ref124"><label>124</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cross</surname><given-names>J</given-names> </name><name name-style="western"><surname>Robinson</surname><given-names>R</given-names> </name><name name-style="western"><surname>Devaraju</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Transforming medical education: assessing the integration of ChatGPT into faculty workflows at a Caribbean medical school</article-title><source>Cureus</source><year>2023</year><month>07</month><volume>15</volume><issue>7</issue><fpage>e41399</fpage><pub-id pub-id-type="doi">10.7759/cureus.41399</pub-id><pub-id pub-id-type="medline">37426402</pub-id></nlm-citation></ref><ref id="ref125"><label>125</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Soulage</surname><given-names>CO</given-names> </name><name name-style="western"><surname>Van Coppenolle</surname><given-names>F</given-names> </name><name name-style="western"><surname>Guebre-Egziabher</surname><given-names>F</given-names> </name></person-group><article-title>The conversational AI &#x201C;ChatGPT&#x201D; outperforms medical students on a physiology university examination</article-title><source>Adv Physiol Educ</source><year>2024</year><month>12</month><day>1</day><volume>48</volume><issue>4</issue><fpage>677</fpage><lpage>684</lpage><pub-id pub-id-type="doi">10.1152/advan.00181.2023</pub-id><pub-id pub-id-type="medline">38991037</pub-id></nlm-citation></ref><ref id="ref126"><label>126</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gritti</surname><given-names>MN</given-names> </name><name name-style="western"><surname>AlTurki</surname><given-names>H</given-names> </name><name name-style="western"><surname>Farid</surname><given-names>P</given-names> </name><name name-style="western"><surname>Morgan</surname><given-names>CT</given-names> </name></person-group><article-title>Progression of an artificial intelligence chatbot (ChatGPT) for pediatric cardiology educational knowledge assessment</article-title><source>Pediatr Cardiol</source><year>2024</year><month>02</month><volume>45</volume><issue>2</issue><fpage>309</fpage><lpage>313</lpage><pub-id pub-id-type="doi">10.1007/s00246-023-03385-6</pub-id><pub-id pub-id-type="medline">38170274</pub-id></nlm-citation></ref><ref id="ref127"><label>127</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bartoli</surname><given-names>A</given-names> </name><name name-style="western"><surname>May</surname><given-names>AT</given-names> </name><name name-style="western"><surname>Al-Awadhi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Schaller</surname><given-names>K</given-names> </name></person-group><article-title>Probing artificial intelligence in neurosurgical training: ChatGPT takes a neurosurgical residents written exam</article-title><source>Brain Spine</source><year>2024</year><volume>4</volume><fpage>102715</fpage><pub-id pub-id-type="doi">10.1016/j.bas.2023.102715</pub-id><pub-id pub-id-type="medline">38163001</pub-id></nlm-citation></ref><ref id="ref128"><label>128</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rasmussen</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Akbarov</surname><given-names>K</given-names> </name><name name-style="western"><surname>Titovich</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Potential of e-learning interventions and artificial intelligence-assisted contouring skills in radiotherapy: the ELAISA study</article-title><source>JCO Glob Oncol</source><year>2024</year><month>08</month><volume>10</volume><issue>10</issue><fpage>e2400173</fpage><pub-id pub-id-type="doi">10.1200/GO.24.00173</pub-id><pub-id pub-id-type="medline">39236283</pub-id></nlm-citation></ref><ref id="ref129"><label>129</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mousavi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Shafiee</surname><given-names>S</given-names> </name><name name-style="western"><surname>Harley</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Cheung</surname><given-names>JCK</given-names> </name><name name-style="western"><surname>Abbasgholizadeh Rahimi</surname><given-names>S</given-names> </name></person-group><article-title>Performance of generative pre-trained transformers (GPTs) in Certification Examination of the College of Family Physicians of Canada</article-title><source>Fam Med Com Health</source><year>2024</year><month>05</month><volume>12</volume><issue>Suppl 1</issue><fpage>e002626</fpage><pub-id pub-id-type="doi">10.1136/fmch-2023-002626</pub-id></nlm-citation></ref><ref id="ref130"><label>130</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Temsah</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Alhuzaimi</surname><given-names>AN</given-names> </name><name name-style="western"><surname>Almansour</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Art or artifact: evaluating the accuracy, appeal, and educational value of AI-generated imagery in DALL&#x00B7;E 3 for illustrating congenital heart diseases</article-title><source>J Med Syst</source><year>2024</year><month>05</month><day>23</day><volume>48</volume><issue>1</issue><fpage>54</fpage><pub-id pub-id-type="doi">10.1007/s10916-024-02072-0</pub-id><pub-id pub-id-type="medline">38780839</pub-id></nlm-citation></ref><ref id="ref131"><label>131</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fang</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Reynaldi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Araminta</surname><given-names>AS</given-names> </name><etal/></person-group><article-title>Artificial intelligence (AI)-driven dental education: exploring the role of chatbots in a clinical learning environment</article-title><source>J Prosthet Dent</source><year>2025</year><month>10</month><volume>134</volume><issue>4</issue><fpage>1296</fpage><lpage>1303</lpage><pub-id pub-id-type="doi">10.1016/j.prosdent.2024.03.038</pub-id><pub-id pub-id-type="medline">38644064</pub-id></nlm-citation></ref><ref id="ref132"><label>132</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cheung</surname><given-names>BHH</given-names> </name><name name-style="western"><surname>Lau</surname><given-names>GKK</given-names> </name><name name-style="western"><surname>Wong</surname><given-names>GTC</given-names> </name><etal/></person-group><article-title>ChatGPT versus human in generating medical graduate exam multiple choice questions-A multinational prospective study (Hong Kong S.A.R., Singapore, Ireland, and the United Kingdom)</article-title><source>PLoS ONE</source><year>2023</year><volume>18</volume><issue>8</issue><fpage>e0290691</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0290691</pub-id><pub-id pub-id-type="medline">37643186</pub-id></nlm-citation></ref><ref id="ref133"><label>133</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ignjatovi&#x0107;</surname><given-names>A</given-names> </name><name name-style="western"><surname>Stevanovi&#x0107;</surname><given-names>L</given-names> </name></person-group><article-title>Efficacy and limitations of ChatGPT as a biostatistical problem-solving tool in medical education in Serbia: a descriptive study</article-title><source>J Educ Eval Health Prof</source><year>2023</year><month>10</month><day>16</day><volume>20</volume><issue>28</issue><fpage>28</fpage><pub-id pub-id-type="doi">10.3352/jeehp.2023.20.28</pub-id></nlm-citation></ref><ref id="ref134"><label>134</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Agarwal</surname><given-names>M</given-names> </name><name name-style="western"><surname>Goswami</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sharma</surname><given-names>P</given-names> </name></person-group><article-title>Evaluating ChatGPT-3.5 and Claude-2 in answering and explaining conceptual medical physiology multiple-choice questions</article-title><source>Cureus</source><year>2023</year><month>09</month><volume>15</volume><issue>9</issue><fpage>e46222</fpage><pub-id pub-id-type="doi">10.7759/cureus.46222</pub-id><pub-id pub-id-type="medline">37908959</pub-id></nlm-citation></ref><ref id="ref135"><label>135</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yanagita</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yokokawa</surname><given-names>D</given-names> </name><name name-style="western"><surname>Fukuzawa</surname><given-names>F</given-names> </name><name name-style="western"><surname>Uchida</surname><given-names>S</given-names> </name><name name-style="western"><surname>Uehara</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ikusaka</surname><given-names>M</given-names> </name></person-group><article-title>Expert assessment of ChatGPT&#x2019;s ability to generate illness scripts: an evaluative study</article-title><source>BMC Med Educ</source><year>2024</year><month>05</month><day>15</day><volume>24</volume><issue>1</issue><fpage>536</fpage><pub-id pub-id-type="doi">10.1186/s12909-024-05534-8</pub-id><pub-id pub-id-type="medline">38750546</pub-id></nlm-citation></ref><ref id="ref136"><label>136</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sauder</surname><given-names>M</given-names> </name><name name-style="western"><surname>Tritsch</surname><given-names>T</given-names> </name><name name-style="western"><surname>Rajput</surname><given-names>V</given-names> </name><name name-style="western"><surname>Schwartz</surname><given-names>G</given-names> </name><name name-style="western"><surname>Shoja</surname><given-names>MM</given-names> </name></person-group><article-title>Exploring generative artificial intelligence-assisted medical education: assessing case-based learning for medical students</article-title><source>Cureus</source><year>2024</year><month>01</month><volume>16</volume><issue>1</issue><fpage>e51961</fpage><pub-id pub-id-type="doi">10.7759/cureus.51961</pub-id><pub-id pub-id-type="medline">38333501</pub-id></nlm-citation></ref><ref id="ref137"><label>137</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hanna</surname><given-names>RE</given-names> </name><name name-style="western"><surname>Smith</surname><given-names>LR</given-names> </name><name name-style="western"><surname>Mhaskar</surname><given-names>R</given-names> </name><name name-style="western"><surname>Hanna</surname><given-names>K</given-names> </name></person-group><article-title>Performance of language models on the family medicine in-training exam</article-title><source>Fam Med</source><year>2024</year><month>10</month><volume>56</volume><issue>9</issue><fpage>555</fpage><lpage>560</lpage><pub-id pub-id-type="doi">10.22454/FamMed.2024.233738</pub-id><pub-id pub-id-type="medline">39207788</pub-id></nlm-citation></ref><ref id="ref138"><label>138</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Takahashi</surname><given-names>H</given-names> </name><name name-style="western"><surname>Shikino</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kondo</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Educational utility of clinical vignettes generated in Japanese by ChatGPT-4: mixed methods study</article-title><source>JMIR Med Educ</source><year>2024</year><month>08</month><day>13</day><volume>10</volume><fpage>e59133</fpage><pub-id pub-id-type="doi">10.2196/59133</pub-id><pub-id pub-id-type="medline">39137031</pub-id></nlm-citation></ref><ref id="ref139"><label>139</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Waikel</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Othman</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Patel</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Recognition of genetic conditions after learning with images created using generative artificial intelligence</article-title><source>JAMA Netw Open</source><year>2024</year><month>03</month><day>4</day><volume>7</volume><issue>3</issue><fpage>e242609</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2024.2609</pub-id><pub-id pub-id-type="medline">38488790</pub-id></nlm-citation></ref><ref id="ref140"><label>140</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Collins</surname><given-names>BR</given-names> </name><name name-style="western"><surname>Black</surname><given-names>EW</given-names> </name><name name-style="western"><surname>Rarey</surname><given-names>KE</given-names> </name></person-group><article-title>Introducing AnatomyGPT: A customized artificial intelligence application for anatomical sciences education</article-title><source>Clin Anat</source><year>2024</year><month>09</month><volume>37</volume><issue>6</issue><fpage>661</fpage><lpage>669</lpage><pub-id pub-id-type="doi">10.1002/ca.24178</pub-id><pub-id pub-id-type="medline">38721869</pub-id></nlm-citation></ref><ref id="ref141"><label>141</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kung</surname><given-names>TH</given-names> </name><name name-style="western"><surname>Cheatham</surname><given-names>M</given-names> </name><name name-style="western"><surname>Medenilla</surname><given-names>A</given-names> </name><etal/></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Dagan</surname><given-names>A</given-names> </name></person-group><article-title>Performance of ChatGPT on USMLE: Potential for AI-assisted medical education using large language models</article-title><source>PLOS Digit Health</source><year>2023</year><month>02</month><volume>2</volume><issue>2</issue><fpage>e0000198</fpage><pub-id pub-id-type="doi">10.1371/journal.pdig.0000198</pub-id><pub-id pub-id-type="medline">36812645</pub-id></nlm-citation></ref><ref id="ref142"><label>142</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roso&#x0142;</surname><given-names>M</given-names> </name><name name-style="western"><surname>G&#x0105;sior</surname><given-names>JS</given-names> </name><name name-style="western"><surname>&#x0141;aba</surname><given-names>J</given-names> </name><name name-style="western"><surname>Korzeniewski</surname><given-names>K</given-names> </name><name name-style="western"><surname>M&#x0142;y&#x0144;czak</surname><given-names>M</given-names> </name></person-group><article-title>Evaluation of the performance of GPT-3.5 and GPT-4 on the Polish Medical Final Examination</article-title><source>Sci Rep</source><year>2023</year><month>11</month><day>22</day><volume>13</volume><issue>1</issue><pub-id pub-id-type="doi">10.1038/s41598-023-46995-z</pub-id></nlm-citation></ref><ref id="ref143"><label>143</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Murphy Lonergan</surname><given-names>R</given-names> </name><name name-style="western"><surname>Curry</surname><given-names>J</given-names> </name><name name-style="western"><surname>Dhas</surname><given-names>K</given-names> </name><name name-style="western"><surname>Simmons</surname><given-names>BI</given-names> </name></person-group><article-title>Stratified evaluation of GPT&#x2019;s question answering in surgery reveals artificial intelligence (AI) knowledge gaps</article-title><source>Cureus</source><year>2023</year><month>11</month><volume>15</volume><issue>11</issue><fpage>e48788</fpage><pub-id pub-id-type="doi">10.7759/cureus.48788</pub-id><pub-id pub-id-type="medline">38098921</pub-id></nlm-citation></ref><ref id="ref144"><label>144</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>W&#x00F3;jcik</surname><given-names>S</given-names> </name><name name-style="western"><surname>Rulkiewicz</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pruszczyk</surname><given-names>P</given-names> </name><name name-style="western"><surname>Lisik</surname><given-names>W</given-names> </name><name name-style="western"><surname>Pobo&#x017C;y</surname><given-names>M</given-names> </name><name name-style="western"><surname>Domienik-Kar&#x0142;owicz</surname><given-names>J</given-names> </name></person-group><article-title>Reshaping medical education: performance of ChatGPT on a PES medical examination</article-title><source>Cardiol J</source><year>2024</year><volume>31</volume><issue>3</issue><fpage>442</fpage><lpage>450</lpage><pub-id pub-id-type="doi">10.5603/cj.97517</pub-id><pub-id pub-id-type="medline">37830257</pub-id></nlm-citation></ref><ref id="ref145"><label>145</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Co&#x015F;kun</surname><given-names>&#x00D6;</given-names> </name><name name-style="western"><surname>K&#x0131;yak</surname><given-names>YS</given-names> </name><name name-style="western"><surname>Budako&#x011F;lu</surname><given-names>I&#x0130;</given-names> </name></person-group><article-title>ChatGPT to generate clinical vignettes for teaching and multiple-choice questions for assessment: A randomized controlled experiment</article-title><source>Med Teach</source><year>2025</year><month>02</month><volume>47</volume><issue>2</issue><fpage>268</fpage><lpage>274</lpage><pub-id pub-id-type="doi">10.1080/0142159X.2024.2327477</pub-id><pub-id pub-id-type="medline">38478902</pub-id></nlm-citation></ref><ref id="ref146"><label>146</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Knoedler</surname><given-names>L</given-names> </name><name name-style="western"><surname>Alfertshofer</surname><given-names>M</given-names> </name><name name-style="western"><surname>Knoedler</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Pure wisdom or potemkin villages? A comparison of ChatGPT 3.5 and ChatGPT 4 on USMLE step 3 style questions: quantitative analysis</article-title><source>JMIR Med Educ</source><year>2024</year><month>01</month><day>5</day><volume>10</volume><fpage>e51148</fpage><pub-id pub-id-type="doi">10.2196/51148</pub-id><pub-id pub-id-type="medline">38180782</pub-id></nlm-citation></ref><ref id="ref147"><label>147</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Uribe</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Maldupa</surname><given-names>I</given-names> </name><name name-style="western"><surname>Kavadella</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Artificial intelligence chatbots and large language models in dental education: worldwide survey of educators</article-title><source>Eur J Dent Educ</source><year>2024</year><month>11</month><volume>28</volume><issue>4</issue><fpage>865</fpage><lpage>876</lpage><pub-id pub-id-type="doi">10.1111/eje.13009</pub-id><pub-id pub-id-type="medline">38586899</pub-id></nlm-citation></ref><ref id="ref148"><label>148</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jarry Trujillo</surname><given-names>C</given-names> </name><name name-style="western"><surname>Vela Ulloa</surname><given-names>J</given-names> </name><name name-style="western"><surname>Escalona Vivas</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Surgeons vs ChatGPT: assessment and feedback performance based on real surgical scenarios</article-title><source>J Surg Educ</source><year>2024</year><month>07</month><volume>81</volume><issue>7</issue><fpage>960</fpage><lpage>966</lpage><pub-id pub-id-type="doi">10.1016/j.jsurg.2024.03.012</pub-id><pub-id pub-id-type="medline">38749814</pub-id></nlm-citation></ref><ref id="ref149"><label>149</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Meo</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Al-Khlaiwi</surname><given-names>T</given-names> </name><name name-style="western"><surname>AbuKhalaf</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Meo</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Klonoff</surname><given-names>DC</given-names> </name></person-group><article-title>The scientific knowledge of Bard and ChatGPT in endocrinology, diabetes, and diabetes technology: multiple-choice questions examination-based performance</article-title><source>J Diabetes Sci Technol</source><year>2025</year><month>05</month><volume>19</volume><issue>3</issue><fpage>705</fpage><lpage>710</lpage><pub-id pub-id-type="doi">10.1177/19322968231203987</pub-id><pub-id pub-id-type="medline">37798960</pub-id></nlm-citation></ref><ref id="ref150"><label>150</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shamim</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Zaidi</surname><given-names>SJA</given-names> </name><name name-style="western"><surname>Rehman</surname><given-names>A</given-names> </name></person-group><article-title>The revival of essay-type questions in medical education: harnessing artificial intelligence and machine learning</article-title><source>J Coll Physicians Surg Pak</source><year>2024</year><month>05</month><volume>34</volume><issue>5</issue><fpage>595</fpage><lpage>599</lpage><pub-id pub-id-type="doi">10.29271/jcpsp.2024.05.595</pub-id><pub-id pub-id-type="medline">38720222</pub-id></nlm-citation></ref><ref id="ref151"><label>151</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Meo</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Alotaibi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Meo</surname><given-names>MZS</given-names> </name><name name-style="western"><surname>Meo</surname><given-names>MOS</given-names> </name><name name-style="western"><surname>Hamid</surname><given-names>M</given-names> </name></person-group><article-title>Medical knowledge of ChatGPT in public health, infectious diseases, COVID-19 pandemic, and vaccines: multiple choice questions examination based performance</article-title><source>Front Public Health</source><year>2024</year><volume>12</volume><fpage>1360597</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2024.1360597</pub-id><pub-id pub-id-type="medline">38711764</pub-id></nlm-citation></ref><ref id="ref152"><label>152</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ba</surname><given-names>H</given-names> </name><name name-style="western"><surname>zhang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Yi</surname><given-names>Z</given-names> </name></person-group><article-title>Enhancing clinical skills in pediatric trainees: a comparative study of ChatGPT-assisted and traditional teaching methods</article-title><source>BMC Med Educ</source><year>2024</year><month>05</month><day>22</day><volume>24</volume><issue>1</issue><pub-id pub-id-type="doi">10.1186/s12909-024-05565-1</pub-id></nlm-citation></ref><ref id="ref153"><label>153</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Almazrou</surname><given-names>S</given-names> </name><name name-style="western"><surname>Alanezi</surname><given-names>F</given-names> </name><name name-style="western"><surname>Almutairi</surname><given-names>SA</given-names> </name><etal/></person-group><article-title>Enhancing medical students critical thinking skills through ChatGPT: An empirical study with medical students</article-title><source>Nutr Health</source><year>2025</year><month>07</month><volume>31</volume><issue>3</issue><fpage>1023</fpage><lpage>1033</lpage><pub-id pub-id-type="doi">10.1177/02601060241273627</pub-id></nlm-citation></ref><ref id="ref154"><label>154</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Crawford</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Hendzlik</surname><given-names>P</given-names> </name><name name-style="western"><surname>Lam</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Digital ink and surgical dreams: perceptions of artificial intelligence&#x2013;generated essays in residency applications</article-title><source>J Surg Res</source><year>2024</year><month>09</month><volume>301</volume><fpage>504</fpage><lpage>511</lpage><pub-id pub-id-type="doi">10.1016/j.jss.2024.06.020</pub-id><pub-id pub-id-type="medline">39042979</pub-id></nlm-citation></ref><ref id="ref155"><label>155</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mosleh</surname><given-names>R</given-names> </name><name name-style="western"><surname>Jarrar</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Jarrar</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tazkarji</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hawash</surname><given-names>M</given-names> </name></person-group><article-title>Medicine and pharmacy students&#x2019; knowledge, attitudes, and practice regarding artificial intelligence programs: Jordan and West Bank of Palestine</article-title><source>Adv Med Educ Pract</source><year>2023</year><volume>14</volume><fpage>1391</fpage><lpage>1400</lpage><pub-id pub-id-type="doi">10.2147/AMEP.S433255</pub-id><pub-id pub-id-type="medline">38106923</pub-id></nlm-citation></ref><ref id="ref156"><label>156</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Western</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Smit</surname><given-names>ES</given-names> </name><name name-style="western"><surname>G&#x00FC;ltzow</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Bridging the digital health divide: a narrative review of the causes, implications, and solutions for digital health inequalities</article-title><source>Health Psychol Behav Med</source><year>2025</year><volume>13</volume><issue>1</issue><fpage>2493139</fpage><pub-id pub-id-type="doi">10.1080/21642850.2025.2493139</pub-id><pub-id pub-id-type="medline">40276490</pub-id></nlm-citation></ref><ref id="ref157"><label>157</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dave</surname><given-names>T</given-names> </name><name name-style="western"><surname>Athaluri</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Singh</surname><given-names>S</given-names> </name></person-group><article-title>ChatGPT in medicine: an overview of its applications, advantages, limitations, future prospects, and ethical considerations</article-title><source>Front Artif Intell</source><year>2023</year><month>05</month><day>4</day><volume>6</volume><pub-id pub-id-type="doi">10.3389/frai.2023.1169595</pub-id></nlm-citation></ref><ref id="ref158"><label>158</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Qu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Global trends and hotspots of ChatGPT in medical research: a bibliometric and visualized study</article-title><source>Front Med</source><year>2024</year><month>05</month><day>16</day><volume>11</volume><pub-id pub-id-type="doi">10.3389/fmed.2024.1406842</pub-id></nlm-citation></ref><ref id="ref159"><label>159</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khan</surname><given-names>N</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Koubaa</surname><given-names>A</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>MK</given-names> </name><name name-style="western"><surname>Salleh</surname><given-names>R bin</given-names> </name></person-group><article-title>Global insights and the impact of generative AI-ChatGPT on multidisciplinary: a systematic review and bibliometric analysis</article-title><source>Conn Sci</source><year>2024</year><month>12</month><day>31</day><volume>36</volume><issue>1</issue><pub-id pub-id-type="doi">10.1080/09540091.2024.2353630</pub-id></nlm-citation></ref><ref id="ref160"><label>160</label><nlm-citation citation-type="web"><article-title>100+ eye-opening ChatGPT statistics: tracing the roots of generative AI to its global dominance</article-title><source>Master of Code</source><year>2025</year><month>01</month><access-date>2025-07-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://masterofcode.com/blog/chatgpt-statistics">https://masterofcode.com/blog/chatgpt-statistics</ext-link></comment></nlm-citation></ref><ref id="ref161"><label>161</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>See</surname><given-names>BH</given-names> </name><name name-style="western"><surname>Gorard</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>B</given-names> </name><name name-style="western"><surname>Dong</surname><given-names>L</given-names> </name><name name-style="western"><surname>Siddiqui</surname><given-names>N</given-names> </name></person-group><article-title>Is technology always helpful?: A critical review of the impact on learning outcomes of education technology in supporting formative assessment in schools</article-title><source>Res Pap Educ</source><year>2022</year><month>11</month><day>2</day><volume>37</volume><issue>6</issue><fpage>1064</fpage><lpage>1096</lpage><pub-id pub-id-type="doi">10.1080/02671522.2021.1907778</pub-id></nlm-citation></ref><ref id="ref162"><label>162</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nazi</surname><given-names>ZA</given-names> </name><name name-style="western"><surname>Peng</surname><given-names>W</given-names> </name></person-group><article-title>Large language models in healthcare and medical domain: a review</article-title><source>Informatics (MDPI)</source><volume>11</volume><issue>3</issue><fpage>57</fpage><pub-id pub-id-type="doi">10.3390/informatics11030057</pub-id></nlm-citation></ref><ref id="ref163"><label>163</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Busch</surname><given-names>F</given-names> </name><name name-style="western"><surname>Hoffmann</surname><given-names>L</given-names> </name><name name-style="western"><surname>Rueger</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Current applications and challenges in large language models for patient care: a systematic review</article-title><source>Commun Med</source><year>2025</year><month>01</month><day>21</day><volume>5</volume><issue>1</issue><pub-id pub-id-type="doi">10.1038/s43856-024-00717-2</pub-id></nlm-citation></ref><ref id="ref164"><label>164</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Meyer</surname><given-names>JG</given-names> </name><name name-style="western"><surname>Urbanowicz</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Martin</surname><given-names>PCN</given-names> </name><etal/></person-group><article-title>ChatGPT and large language models in academia: opportunities and challenges</article-title><source>BioData Min</source><year>2023</year><month>07</month><day>13</day><volume>16</volume><issue>1</issue><pub-id pub-id-type="doi">10.1186/s13040-023-00339-9</pub-id></nlm-citation></ref><ref id="ref165"><label>165</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mao</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>B</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>JC</given-names> </name></person-group><article-title>Generative artificial intelligence in education and its implications for assessment</article-title><source>TechTrends</source><year>2024</year><month>01</month><volume>68</volume><issue>1</issue><fpage>58</fpage><lpage>66</lpage><pub-id pub-id-type="doi">10.1007/s11528-023-00911-4</pub-id></nlm-citation></ref><ref id="ref166"><label>166</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Turner</surname><given-names>L</given-names> </name><name name-style="western"><surname>Hashimoto</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Vasisht</surname><given-names>S</given-names> </name><name name-style="western"><surname>Schaye</surname><given-names>V</given-names> </name></person-group><article-title>Demystifying AI: current state and future role in medical education assessment</article-title><source>Acad Med</source><year>2024</year><month>04</month><day>1</day><volume>99</volume><issue>4S Suppl 1</issue><fpage>S42</fpage><lpage>S47</lpage><pub-id pub-id-type="doi">10.1097/ACM.0000000000005598</pub-id><pub-id pub-id-type="medline">38166201</pub-id></nlm-citation></ref><ref id="ref167"><label>167</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lakhtakia</surname><given-names>R</given-names> </name><name name-style="western"><surname>Otaki</surname><given-names>F</given-names> </name><name name-style="western"><surname>Alsuwaidi</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zary</surname><given-names>N</given-names> </name></person-group><article-title>Assessment as learning in medical education: feasibility and perceived impact of student-generated formative assessments</article-title><source>JMIR Med Educ</source><year>2022</year><month>07</month><day>22</day><volume>8</volume><issue>3</issue><fpage>e35820</fpage><pub-id pub-id-type="doi">10.2196/35820</pub-id><pub-id pub-id-type="medline">35867379</pub-id></nlm-citation></ref><ref id="ref168"><label>168</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Machkour</surname><given-names>M</given-names> </name><name name-style="western"><surname>El Jihaoui</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lamalif</surname><given-names>L</given-names> </name><name name-style="western"><surname>Faris</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mansouri</surname><given-names>K</given-names> </name></person-group><article-title>Toward an adaptive learning assessment pathway</article-title><source>Front Educ</source><year>2025</year><volume>10</volume><pub-id pub-id-type="doi">10.3389/feduc.2025.1498233</pub-id></nlm-citation></ref><ref id="ref169"><label>169</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Solis Trujillo</surname><given-names>BP</given-names> </name><name name-style="western"><surname>Velarde-Camaqui</surname><given-names>D</given-names> </name><name name-style="western"><surname>Gonzales Nu&#x00F1;ez</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Castillo Silva</surname><given-names>EV</given-names> </name><name name-style="western"><surname>Gonzalez Said de la Oliva</surname><given-names>M del P</given-names> </name></person-group><article-title>The current landscape of formative assessment and feedback in graduate studies: a systematic literature review</article-title><source>Front Educ</source><year>2025</year><month>05</month><day>12</day><volume>10</volume><pub-id pub-id-type="doi">10.3389/feduc.2025.1509983</pub-id></nlm-citation></ref><ref id="ref170"><label>170</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wilson</surname><given-names>C</given-names> </name><name name-style="western"><surname>Scott</surname><given-names>B</given-names> </name></person-group><article-title>Adaptive systems in education: a review and conceptual unification</article-title><source>IJILT</source><year>2017</year><month>01</month><day>3</day><volume>34</volume><issue>1</issue><fpage>2</fpage><lpage>19</lpage><pub-id pub-id-type="doi">10.1108/IJILT-09-2016-0040</pub-id></nlm-citation></ref><ref id="ref171"><label>171</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kolluru</surname><given-names>V</given-names> </name><name name-style="western"><surname>Mungara</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chintakunta</surname><given-names>AN</given-names> </name></person-group><article-title>Adaptive learning systems: harnessing AI for customized educational experiences</article-title><source>IJCSITY</source><year>2018</year><month>08</month><day>30</day><access-date>2025-10-09</access-date><volume>6</volume><issue>3</issue><fpage>13</fpage><lpage>26</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://airccse.org/journal/ijcsity/Current2018.html">https://airccse.org/journal/ijcsity/Current2018.html</ext-link></comment><pub-id pub-id-type="doi">10.5121/ijcsity.2018.6302</pub-id></nlm-citation></ref><ref id="ref172"><label>172</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cross</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Choma</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Onofrey</surname><given-names>JA</given-names> </name></person-group><article-title>Bias in medical AI: Implications for clinical decision-making</article-title><source>PLOS Digit Health</source><year>2024</year><month>11</month><volume>3</volume><issue>11</issue><fpage>e0000651</fpage><pub-id pub-id-type="doi">10.1371/journal.pdig.0000651</pub-id></nlm-citation></ref><ref id="ref173"><label>173</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Sawan</surname><given-names>M</given-names> </name></person-group><article-title>Balancing automation and empathy: how teachers can thrive with AI</article-title><source>Zenodo</source><comment>Preprint posted online on  May 18, 2025</comment><pub-id pub-id-type="doi">10.5281/zenodo.15456225</pub-id></nlm-citation></ref><ref id="ref174"><label>174</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bond</surname><given-names>M</given-names> </name><name name-style="western"><surname>Khosravi</surname><given-names>H</given-names> </name><name name-style="western"><surname>De Laat</surname><given-names>M</given-names> </name><etal/></person-group><article-title>A meta systematic review of artificial intelligence in higher education: a call for increased ethics, collaboration, and rigour</article-title><source>Int J Educ Technol High Educ</source><year>2024</year><month>01</month><day>19</day><volume>21</volume><issue>1</issue><pub-id pub-id-type="doi">10.1186/s41239-023-00436-z</pub-id></nlm-citation></ref><ref id="ref175"><label>175</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Resnik</surname><given-names>DB</given-names> </name><name name-style="western"><surname>Hosseini</surname><given-names>M</given-names> </name></person-group><article-title>The ethics of using artificial intelligence in scientific research: new guidance needed for a new tool</article-title><source>AI Ethics</source><year>2025</year><month>04</month><volume>5</volume><issue>2</issue><fpage>1499</fpage><lpage>1521</lpage><pub-id pub-id-type="doi">10.1007/s43681-024-00493-8</pub-id></nlm-citation></ref><ref id="ref176"><label>176</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tong</surname><given-names>D</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>B</given-names> </name><name name-style="western"><surname>Tao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ren</surname><given-names>H</given-names> </name><name name-style="western"><surname>Atiquil Islam</surname><given-names>AYM</given-names> </name><name name-style="western"><surname>Bao</surname><given-names>L</given-names> </name></person-group><article-title>Exploring the role of human-AI collaboration in solving scientific problems</article-title><source>Phys Rev Phys Educ Res</source><year>2025</year><month>05</month><volume>21</volume><issue>1</issue><fpage>010149</fpage><pub-id pub-id-type="doi">10.1103/PhysRevPhysEducRes.21.010149</pub-id></nlm-citation></ref><ref id="ref177"><label>177</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Hwang</surname><given-names>H</given-names> </name></person-group><article-title>The ethics of using artificial intelligence in medical research</article-title><source>KMJ</source><year>2024</year><month>12</month><volume>39</volume><issue>4</issue><fpage>229</fpage><lpage>237</lpage><pub-id pub-id-type="doi">10.7180/kmj.24.140</pub-id></nlm-citation></ref><ref id="ref178"><label>178</label><nlm-citation citation-type="book"><source>Web-Based Medical Teaching Using a Multi-Agent System Applications and Innovations in Intelligent Systems XIII</source><publisher-name>Springer London</publisher-name><fpage>181</fpage><lpage>194</lpage><pub-id pub-id-type="doi">10.1007/1-84628-224-1_14</pub-id><pub-id pub-id-type="other">978-1-84628-223-2</pub-id></nlm-citation></ref><ref id="ref179"><label>179</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Wei</surname><given-names>H</given-names> </name><name name-style="western"><surname>Qiu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>H</given-names> </name><name name-style="western"><surname>Yuan</surname><given-names>W</given-names> </name></person-group><article-title>MEDCO: medical education copilots based on a multi-agent framework</article-title><source>arXiv</source><comment>Preprint posted online on  Aug 22, 2024</comment><pub-id pub-id-type="doi">10.48550/ARXIV.2408.12496</pub-id></nlm-citation></ref><ref id="ref180"><label>180</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>F</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>H</given-names> </name><name name-style="western"><surname>Gu</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Application of large language models in medicine</article-title><source>Nat Rev Bioeng</source><year>2025</year><access-date>2025-07-12</access-date><volume>3</volume><issue>6</issue><fpage>445</fpage><lpage>464</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://www.nature.com/articles/s44222-025-00279-5">https://www.nature.com/articles/s44222-025-00279-5</ext-link></comment><pub-id pub-id-type="doi">10.1038/s44222-025-00279-5</pub-id></nlm-citation></ref><ref id="ref181"><label>181</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>K</given-names> </name><name name-style="western"><surname>Meng</surname><given-names>X</given-names> </name><name name-style="western"><surname>Yan</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Revolutionizing health care: the transformative impact of large language models in medicine</article-title><source>J Med Internet Res</source><year>2025</year><month>01</month><day>7</day><volume>27</volume><fpage>e59069</fpage><pub-id pub-id-type="doi">10.2196/59069</pub-id><pub-id pub-id-type="medline">39773666</pub-id></nlm-citation></ref><ref id="ref182"><label>182</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hasanzadeh</surname><given-names>F</given-names> </name><name name-style="western"><surname>Josephson</surname><given-names>CB</given-names> </name><name name-style="western"><surname>Waters</surname><given-names>G</given-names> </name><name name-style="western"><surname>Adedinsewo</surname><given-names>D</given-names> </name><name name-style="western"><surname>Azizi</surname><given-names>Z</given-names> </name><name name-style="western"><surname>White</surname><given-names>JA</given-names> </name></person-group><article-title>Bias recognition and mitigation strategies in artificial intelligence healthcare applications</article-title><source>NPJ Digit Med</source><year>2025</year><month>03</month><day>11</day><volume>8</volume><issue>1</issue><fpage>154</fpage><pub-id pub-id-type="doi">10.1038/s41746-025-01503-7</pub-id><pub-id pub-id-type="medline">40069303</pub-id></nlm-citation></ref><ref id="ref183"><label>183</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>H</given-names> </name><name name-style="western"><surname>Li</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Review on security of federated learning and its application in healthcare</article-title><source>Future Generation Computer Systems</source><year>2023</year><month>07</month><volume>144</volume><fpage>271</fpage><lpage>290</lpage><pub-id pub-id-type="doi">10.1016/j.future.2023.02.021</pub-id></nlm-citation></ref><ref id="ref184"><label>184</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>F</given-names> </name><name name-style="western"><surname>Qiu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>C</given-names> </name><name name-style="western"><surname>Nunes</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>H</given-names> </name></person-group><article-title>Privacy-preserving healthcare and medical data collaboration service system based on blockchain and federated learning</article-title><source>CMC</source><year>2024</year><volume>80</volume><issue>2</issue><fpage>2897</fpage><lpage>2915</lpage><pub-id pub-id-type="doi">10.32604/cmc.2024.052570</pub-id></nlm-citation></ref><ref id="ref185"><label>185</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ozer</surname><given-names>M</given-names> </name></person-group><article-title>The Matthew Effect in Turkish Education System</article-title><source>BUJFED</source><year>2024</year><month>11</month><day>13</day><pub-id pub-id-type="doi">10.14686/buefad.1359312</pub-id></nlm-citation></ref><ref id="ref186"><label>186</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lucchi</surname><given-names>N</given-names> </name></person-group><article-title>ChatGPT: a case study on copyright challenges for generative artificial intelligence systems</article-title><source>Eur j risk regul</source><year>2024</year><month>09</month><volume>15</volume><issue>3</issue><fpage>602</fpage><lpage>624</lpage><pub-id pub-id-type="doi">10.1017/err.2023.59</pub-id></nlm-citation></ref><ref id="ref187"><label>187</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mitra</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mawson</surname><given-names>A</given-names> </name></person-group><article-title>Neglected tropical diseases: epidemiology and global burden</article-title><source>TropicalMed</source><year>2017</year><month>08</month><day>5</day><volume>2</volume><issue>3</issue><fpage>36</fpage><pub-id pub-id-type="doi">10.3390/tropicalmed2030036</pub-id></nlm-citation></ref><ref id="ref188"><label>188</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Paranjape</surname><given-names>K</given-names> </name><name name-style="western"><surname>Schinkel</surname><given-names>M</given-names> </name><name name-style="western"><surname>Nannan Panday</surname><given-names>R</given-names> </name><name name-style="western"><surname>Car</surname><given-names>J</given-names> </name><name name-style="western"><surname>Nanayakkara</surname><given-names>P</given-names> </name></person-group><article-title>Introducing artificial intelligence training in medical education</article-title><source>JMIR Med Educ</source><year>2019</year><month>12</month><day>3</day><volume>5</volume><issue>2</issue><fpage>e16048</fpage><pub-id pub-id-type="doi">10.2196/16048</pub-id><pub-id pub-id-type="medline">31793895</pub-id></nlm-citation></ref><ref id="ref189"><label>189</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Talib</surname><given-names>ZM</given-names> </name><name name-style="western"><surname>Kiguli-Malwadde</surname><given-names>E</given-names> </name><name name-style="western"><surname>Wohltjen</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Transforming health professions&#x2019; education through in-country collaboration: examining the consortia among African medical schools catalyzed by the Medical Education Partnership Initiative</article-title><source>Hum Resour Health</source><year>2015</year><month>12</month><volume>13</volume><issue>1</issue><pub-id pub-id-type="doi">10.1186/1478-4491-13-1</pub-id></nlm-citation></ref><ref id="ref190"><label>190</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ueda</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kakinuma</surname><given-names>T</given-names> </name><name name-style="western"><surname>Fujita</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Fairness of artificial intelligence in healthcare: review and recommendations</article-title><source>Jpn J Radiol</source><year>2024</year><month>01</month><volume>42</volume><issue>1</issue><fpage>3</fpage><lpage>15</lpage><pub-id pub-id-type="doi">10.1007/s11604-023-01474-3</pub-id></nlm-citation></ref><ref id="ref191"><label>191</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bui</surname><given-names>TTU</given-names> </name><name name-style="western"><surname>Tong</surname><given-names>TVA</given-names> </name></person-group><article-title>The impact of AI writing tools on academic integrity: unveiling English-majored students&#x2019; perceptions and practical solutions</article-title><source>acoj</source><year>2025</year><month>01</month><day>27</day><access-date>2025-10-09</access-date><volume>16</volume><issue>1</issue><fpage>83</fpage><lpage>110</lpage><comment><ext-link ext-link-type="uri" xlink:href="http://asiacall-acoj.org/index.php/journal/issue/view/7">http://asiacall-acoj.org/index.php/journal/issue/view/7</ext-link></comment><pub-id pub-id-type="doi">10.54855/acoj.251615</pub-id></nlm-citation></ref><ref id="ref192"><label>192</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yoo</surname><given-names>JH</given-names> </name></person-group><article-title>Defining the boundaries of AI use in scientific writing: a comparative review of editorial policies</article-title><source>J Korean Med Sci</source><year>2025</year><month>06</month><day>16</day><volume>40</volume><issue>23</issue><fpage>e187</fpage><pub-id pub-id-type="doi">10.3346/jkms.2025.40.e187</pub-id><pub-id pub-id-type="medline">40524628</pub-id></nlm-citation></ref><ref id="ref193"><label>193</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schwartzstein</surname><given-names>RM</given-names> </name></person-group><article-title>Clinical reasoning and artificial intelligence: Can AI really think</article-title><source>Trans Am Clin Climatol Assoc</source><year>2024</year><volume>134</volume><fpage>133</fpage><lpage>145</lpage><pub-id pub-id-type="medline">39135584</pub-id></nlm-citation></ref><ref id="ref194"><label>194</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Jeong</surname><given-names>H</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Medical hallucinations in foundation models and their impact on healthcare</article-title><source>arXiv</source><comment>Preprint posted online on  Feb 26, 2025</comment><pub-id pub-id-type="doi">10.48550/arXiv.2503.05777</pub-id></nlm-citation></ref><ref id="ref195"><label>195</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alkhanbouli</surname><given-names>R</given-names> </name><name name-style="western"><surname>Matar Abdulla Almadhaani</surname><given-names>H</given-names> </name><name name-style="western"><surname>Alhosani</surname><given-names>F</given-names> </name><name name-style="western"><surname>Simsekler</surname><given-names>MCE</given-names> </name></person-group><article-title>The role of explainable artificial intelligence in disease prediction: a systematic literature review and future research directions</article-title><source>BMC Med Inform Decis Mak</source><year>2025</year><volume>25</volume><issue>1</issue><pub-id pub-id-type="doi">10.1186/s12911-025-02944-6</pub-id></nlm-citation></ref><ref id="ref196"><label>196</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cohen</surname><given-names>IG</given-names> </name><name name-style="western"><surname>Babic</surname><given-names>B</given-names> </name><name name-style="western"><surname>Gerke</surname><given-names>S</given-names> </name><name name-style="western"><surname>Xia</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Evgeniou</surname><given-names>T</given-names> </name><name name-style="western"><surname>Wertenbroch</surname><given-names>K</given-names> </name></person-group><article-title>How AI can learn from the law: putting humans in the loop only on appeal</article-title><source>npj Digit Med</source><year>2023</year><month>08</month><day>25</day><volume>6</volume><issue>1</issue><pub-id pub-id-type="doi">10.1038/s41746-023-00906-8</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Technical features and application comparison of mainstream generative artificial intelligence (GAI) models.</p><media xlink:href="mededu_v11i1e71125_app1.docx" xlink:title="DOCX File, 18 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Search strategy.</p><media xlink:href="mededu_v11i1e71125_app2.doc" xlink:title="DOC File, 58 KB"/></supplementary-material><supplementary-material id="app3"><label>Checklist 1</label><p>PRISMA-ScR checklist.</p><media xlink:href="mededu_v11i1e71125_app3.docx" xlink:title="DOCX File, 67 KB"/></supplementary-material></app-group></back></article>