<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Educ</journal-id><journal-id journal-id-type="publisher-id">mededu</journal-id><journal-id journal-id-type="index">20</journal-id><journal-title>JMIR Medical Education</journal-title><abbrev-journal-title>JMIR Med Educ</abbrev-journal-title><issn pub-type="epub">2369-3762</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v12i1e81264</article-id><article-id pub-id-type="doi">10.2196/81264</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Comparing AI-Assisted Problem-Solving Ability With Internet Search Engine and e-Books in Medical Students With Variable Prior Subject Knowledge: Cross-Sectional Study</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Xavier</surname><given-names>Ajiith</given-names></name><degrees>MBBS, MD</degrees><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Naeem</surname><given-names>Syed Shariq</given-names></name><degrees>MBBS, MD, DM</degrees><xref ref-type="aff" rid="aff1"/><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Rizwi</surname><given-names>Waseem</given-names></name><degrees>MBBS, MD, PhD</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Rabha</surname><given-names>Hiramani</given-names></name><degrees>MBBS, MD</degrees><xref ref-type="aff" rid="aff1"/></contrib></contrib-group><aff id="aff1"><institution>Department of Pharmacology, Jawaharlal Nehru Medical College and Hospital, Aligarh Muslim University</institution><addr-line>Medical Road</addr-line><addr-line>Aligarh</addr-line><addr-line>Uttar Pradesh</addr-line><country>India</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Gentges</surname><given-names>Joshua</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Chartash</surname><given-names>David</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Santos-Gago</surname><given-names>Juan M</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Sakaguchi</surname><given-names>Kota</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Syed Shariq Naeem, MBBS, MD, DM, Department of Pharmacology, Jawaharlal Nehru Medical College and Hospital, Aligarh Muslim University, Medical Road, Aligarh, Uttar Pradesh, 202001, India, 91 9634912166; <email>syedshariq1@gmail.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>6</day><month>1</month><year>2026</year></pub-date><volume>12</volume><elocation-id>e81264</elocation-id><history><date date-type="received"><day>25</day><month>07</month><year>2025</year></date><date date-type="rev-recd"><day>04</day><month>11</month><year>2025</year></date><date date-type="accepted"><day>06</day><month>11</month><year>2025</year></date></history><copyright-statement>&#x00A9; Ajiith Xavier, Syed Shariq Naeem, Waseem Rizwi, Hiramani Rabha. Originally published in JMIR Medical Education (<ext-link ext-link-type="uri" xlink:href="https://mededu.jmir.org">https://mededu.jmir.org</ext-link>), 6.1.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Education, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://mededu.jmir.org/">https://mededu.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://mededu.jmir.org/2026/1/e81264"/><abstract><sec><title>Background</title><p>Artificial intelligence (AI), particularly large language models (LLMs) such as ChatGPT (OpenAI), is rapidly influencing medical education. Its effectiveness for students with varying levels of prior knowledge remains underexplored.</p></sec><sec><title>Objective</title><p>This study aimed to evaluate the performance of medical students with and without formal pharmacology knowledge when using AI-LLM GPTs, internet search engines, e-books, or self-knowledge to solve multiple-choice questions (MCQs).</p></sec><sec sec-type="methods"><title>Methods</title><p>A cross-sectional study was conducted at a tertiary care teaching hospital with 100 medical students, divided into a &#x201C;naive&#x201D; group (n=50; no pharmacology training) and a &#x201C;learned&#x201D; group (n=50; completed pharmacology training). The study was started after approval from the Institutional Ethics Committee of Jawaharlal Nehru Medical College Hospital, Aligarh Muslim University (1018/IEC/23/8/23). Each participant answered 4 sets of 20 MCQs using self-knowledge, e-books, Google, or ChatGPT-4o. Scores were compared using analysis of covariance with self-knowledge scores as a covariate.</p></sec><sec sec-type="results"><title>Results</title><p>Learned students significantly outperformed naive students across all methods (<italic>P</italic>&#x003C;.001), with the largest effect size in the AI-LLM GPT set (partial &#x03B7;&#x00B2;=0.328). For both groups, the performance hierarchy was AI-LLM GPT &#x003E; internet search engine &#x003E; self-knowledge &#x2248; e-books. Notably, the naive students who used AI scored higher (mean 13.24, SD 3.31) than the learned students who used Google (mean 12.14, SD 2.01; <italic>P</italic>=.01) or e-books (mean 10.22, SD 3.12; <italic>P</italic>&#x003C;.001).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>AI-LLM GPTs can significantly enhance problem-solving performance in MCQ-based assessments, particularly for students with limited prior knowledge, even allowing them to outperform knowledgeable peers using traditional digital resources. This underscores the potential of AI to transform learning support in medical education, although its impact on deep learning and critical thinking requires further investigation.</p></sec></abstract><kwd-group><kwd>artificial intelligence</kwd><kwd>AI</kwd><kwd>large language models</kwd><kwd>LLM</kwd><kwd>medical education</kwd><kwd>ChatGPT</kwd><kwd>cognitive performance</kwd><kwd>subject-naive learners</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Artificial intelligence (AI) is the ability of a digital computer or computer-controlled robot to perform tasks commonly associated with intelligent beings [<xref ref-type="bibr" rid="ref1">1</xref>]. This includes the ability to reason, discover meaning, generalize, and learn from past experiences [<xref ref-type="bibr" rid="ref2">2</xref>]. Since the development of digital computers in the 1940s, it has been demonstrated that computers can be programmed to perform extremely complex tasks, such as proving mathematical theorems or playing chess, with great proficiency [<xref ref-type="bibr" rid="ref3">3</xref>]. AI involves the science and engineering of creating systems capable of performing tasks that require humanlike intelligence, including learning, judgment, and decision-making [<xref ref-type="bibr" rid="ref4">4</xref>]. AI has successfully solved complex problems in various domains, including education. The application of AI in natural language processing has led to the creation of intelligent chatbots and virtual assistants capable of understanding and producing human language [<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>Popenici and Kerr [<xref ref-type="bibr" rid="ref6">6</xref>] investigated the impact of AI systems on learning and teaching, highlighting potential conflicts between students and instructors, such as privacy concerns, changes in power structures, and excessive control. These studies have called for further research into the impact of AI systems on learner-instructor interactions to identify gaps, issues, or barriers that prevent AI systems from achieving their intended potential [<xref ref-type="bibr" rid="ref7">7</xref>].</p><p>In the modern era of education, technology has become an integral part of the learning process. The advent of advanced language models such as ChatGPT (OpenAI), along with the vast availability of information on platforms such as Google and e-books, enables educators to enhance students&#x2019; educational experiences [<xref ref-type="bibr" rid="ref7">7</xref>].</p><p>Medical education demands not only the acquisition of factual knowledge but also the development of critical thinking and decision-making skills [<xref ref-type="bibr" rid="ref8">8</xref>]. However, the effectiveness of AI&#x2013;large language model (LLM) GPT&#x2013;driven tools in enhancing these competencies remains underexplored, particularly concerning the prior knowledge of learners [<xref ref-type="bibr" rid="ref9">9</xref>]. Students with strong foundational knowledge can use AI tools to deepen their understanding and sharpen their reasoning. In contrast, those with less prior knowledge may use them to fill gaps in their learning or face some difficulties in comprehension [<xref ref-type="bibr" rid="ref10">10</xref>].</p><p>This study used ChatGPT-4o as the representative AI-LLM GPT tool for 2 reasons. First, ChatGPT was widely accessible to students at the time of study and required minimal technical expertise. Second, it represents the current generation of general-purpose LLMs that students are likely to encounter in real-world educational settings. The most notable advantage is its breadth of training data, which expanded from 175 billion parameters in GPT-3.5 to 1 trillion in the GPT-4.0 model [<xref ref-type="bibr" rid="ref11">11</xref>]. Bing&#x2019;s current AI model has 175 billion parameters, and Microsoft&#x2019;s Bard has 540 billion in comparison [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. The domain-specific LLMs, enriched with pharmacology databases or specialized medical AI agents, may offer better performance characteristics, but widespread use of such tools is still limited due to paywall and validation issues.</p><p>The aim of this study is to compare the effectiveness of AI-LLM GPT tools (ChatGPT-4o), internet search engines (Google), e-books, and self-knowledge for answering pharmacology multiple-choice questions (MCQs) among medical students with different levels of prior pharmacology knowledge (naive vs learned groups). The study explores the assistance provided by AI-LLM GPT tools in the ability of problem solving using a cross-sectional design.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethical Considerations</title><p>This was a cross-sectional study conducted at a tertiary care teaching hospital. The study was started after approval from the Institutional Ethics Committee of Jawaharlal Nehru Medical College Hospital, Aligarh Muslim University (1018/IEC/23/8/23). All participants were adult MBBS students and provided written informed consent after receiving information about the study purpose and procedures. Data were collected anonymously using coded identifiers. No personal or identifiable information was recorded or published. Participants received no monetary or academic compensation.</p></sec><sec id="s2-2"><title>Setting and Participants</title><p>Participants included 50 second-year medical students who had just joined the second year and 50 third-year students who had recently passed their second year (ie, N=100). The second-year students, designated as the &#x201C;naive group,&#x201D; had no prior formal exposure to pharmacology coursework. The third-year students, designated as the &#x201C;learned group,&#x201D; had completed a comprehensive 1-year pharmacology curriculum during their second year. This curriculum consisted of 80 hours of didactic lectures, 150 hours of interactive teaching, including practical laboratory sessions, case-based learning modules, self-directed learning modules, short group teaching, and regular assessments, including sessional and professional examinations. Students had completed this coursework approximately 2&#x2010;3 months prior to participation in this study. The curriculum covered topics such as general pharmacology, autonomic pharmacology, cardiovascular drugs, and antimicrobials, aligned with the medical council syllabus for undergraduate medical education. All learned group participants had passed their second-year pharmacology examination with a minimum score of 50%.</p></sec><sec id="s2-3"><title>Study Development</title><p>Prior to the assessment, all participants received a 15-minute standardized orientation session on using ChatGPT and were provided with an eBook of Pharmacology. This training covered basic prompt formulation and how to ask follow-up questions. Students accessed ChatGPT through computer workstations in a controlled examination hall environment to ensure standardized conditions. For the Google search set, students used desktop computers with standard Google Chrome or Mozilla Firefox browsers. For the e-book set, students were provided with PDF versions of a pharmacology textbook accessible on the same computers. The training session was conducted using a standardized presentation to maintain homogeneity of assistance tool exposure. The self-knowledge set required no external tools. All sessions were proctored to ensure compliance with assigned methods for each question set.</p><p>The 80 MCQs were divided into four parallel sets (A, B, C, and D), each containing 20 questions. To ensure equivalence across sets, questions were matched for content area coverage (eg, autonomic, cardiovascular, and chemotherapy) [<xref ref-type="bibr" rid="ref1">1</xref>], question type (theory, calculation, or image-based) [<xref ref-type="bibr" rid="ref2">2</xref>], and estimated difficulty level based on faculty assessment [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>Students had 15 minutes to respond to each set of questions. They were instructed to respond to the questions in a manner that self-knowledge was used to answer questions in set A; e-books were used to answer questions in set B; internet search engine (Google) was used to answer questions in set C; and AI-LLM GPT (ChatGPT) was used to answer questions in set D. Each correct answer was given 1 mark, and no negative marking was given. The methodology flowchart of this study is shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Methodology flowchart.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v12i1e81264_fig01.png"/></fig></sec><sec id="s2-4"><title>Statistical Analysis</title><p>Data analysis was done using SPSS (version 23; IBM Corp) and R software package (R Foundation for Statistical Computing). The mean (the average number of correctly answered questions out of the 20 MCQs included in each augmentation set such as self-knowledge, e-book, internet search engine, and GPT-4o) between different groups was assessed using the independent test. Intergroup and intragroup comparisons were conducted using analysis of covariance (ANCOVA), with self-knowledge group (set A) being a covariate. A <italic>P</italic> value &#x003C;.05 was considered to indicate statistical significance.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>The intergroup comparison between the learned and naive student groups was analyzed using ANCOVA. The estimated marginal means, partial &#x03B7;&#x00B2; values, and statistical significance for each group are presented in <xref ref-type="table" rid="table1">Table 1</xref>. The self-knowledge set was used as a covariate in the analysis to control for baseline differences in knowledge across the sets. This approach allowed for a more accurate assessment of the effects of the augmented resources methods (ChatGPT-4o, Google, and e-books) on student performance.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Intergroup comparison between the learned and naive using analysis of covariance (N=100).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Augmentation resource and group</td><td align="left" valign="bottom">Score, mean (SD)</td><td align="left" valign="bottom">Estimated marginal mean</td><td align="left" valign="bottom">Partial &#x03B7;&#x00B2;</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4">AI<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>-LLM<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> GPT (ChatGPT-4o)</td><td align="char" char="." valign="top">0.328</td><td align="char" char="." valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Naive</td><td align="left" valign="top">13.24 (3.31)</td><td align="left" valign="top">13.18</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Learned</td><td align="left" valign="top">15.42 (1.89)</td><td align="left" valign="top">15.48</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">Internet search engine (Google)</td><td align="char" char="." valign="top">0.241</td><td align="char" char="." valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Naive</td><td align="left" valign="top">10.82 (2.13)</td><td align="left" valign="top">10.76</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Learned</td><td align="left" valign="top">12.14 (2.01)</td><td align="left" valign="top">12.20</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="4">e-Books</td><td align="char" char="." valign="top">0.195</td><td align="char" char="." valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Naive</td><td align="left" valign="top">5.82 (2.77)</td><td align="left" valign="top">5.78</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Learned</td><td align="left" valign="top">10.22 (3.12)</td><td align="left" valign="top">10.26</td><td align="left" valign="top"/><td align="left" valign="top"/></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>AI: artificial intelligence.</p></fn><fn id="table1fn2"><p><sup>b</sup>LLM: large language model.</p></fn></table-wrap-foot></table-wrap><p>The analysis of estimated marginal means revealed that the learned students consistently outperformed the naive students across all sets. In the AI-LLM GPT (ChatGPT-4o) set, the learned students achieved an estimated marginal mean of 15.48 compared to 13.18 for the naive students, with a large effect size (partial &#x03B7;&#x00B2;=0.328, <italic>P</italic>&#x003C;.001). In the internet search engine (Google) set, the estimated marginal mean for the learned students was 12.20, whereas the naive students scored 10.76, with a moderate effect size (partial &#x03B7;&#x00B2;=0.241; <italic>P</italic>&#x003C;.001). The learned students in the e-book set had an estimated marginal mean of 10.26, whereas the naive students had 5.78, a moderate effect size (partial n<sup>2</sup>=0.195; <italic>P</italic>&#x003C;.001).</p><p>The post hoc analysis for the naive group shows that the AI-LLM GPT-assisted method resulted in the highest performance when compared to other methods like internet search engine&#x2013;based learning, self-knowledge, and e-books methods. A significant difference was found in all pairwise comparisons (<italic>P</italic>&#x003C;.001) except for e-books versus self-knowledge, which was not statistically significant (mean difference=&#x2212;0.30; <italic>P</italic>=.91). The performance hierarchy observed was AI-LLM GPT versus self-knowledge (<italic>P</italic>&#x003C;.001) <bold>&#x003E;</bold> internet search engine versus self-knowledge (<italic>P</italic>&#x003C;.001) <bold>&#x003E;</bold> self-knowledge &#x2248; e-books (<italic>P</italic>=.91), showing the superior effectiveness of AI tools for naive learners.</p><p>The post hoc analysis for the learned group shows that the AI-LLM GPT&#x2013;assisted learning method resulted in the highest performance when compared to other methods, whereas self-knowledge and e-books methods showed the lowest and statistically similar outcomes (mean difference=&#x2212;0.72, <italic>P</italic>=.33). Significant differences were observed between Google and self-knowledge sets (<italic>P</italic>=.04), ChatGPT-4o and self-knowledge sets (<italic>P</italic>&#x003C;.001), Google and e-books sets (<italic>P</italic>&#x003C;.001), ChatGPT-4o and e-books (<italic>P</italic>&#x003C;.001), and ChatGPT-4o and Google (<italic>P</italic>&#x003C;.001), indicating a superior performance across these comparisons. The overall performance hierarchy observed was: AI-LLM GPT &#x003E; internet search engine &#x003E; self-knowledge &#x2248; e-books, indicating the superior effectiveness of AI-LLM GPT in enhancing learning outcomes, even for participants with prior knowledge (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>The mean comparison between the sets, as presented in <xref ref-type="fig" rid="figure2">Figure 2</xref>, highlights that learned students consistently outperformed naive students across all categories, as expected. The AI-LLM set achieved the highest performance, with a mean score of 15.3 (SD 1.776). Conversely, the lowest mean was observed in the e-books set, in which learned students scored 10.3 (SD 3.1) and naive students scored 5.7 (SD 2.7).</p><p>Interestingly, the self-knowledge sets performed better than the e-books sets, with naive group students achieving a mean score of 6.0 (SD 1.9) and learned group students scoring a mean of 10.96 (SD 2.2). This may be due to the fact that students in the e-book sets spent sufficient time searching for relevant chapters instead of focusing on answering the questions. This led to some questions being left unanswered that likely contributed to their lower overall performance.</p><p>While ANCOVA analysis confirmed that the learned students consistently outperformed the naive students when comparing the same learning method (as shown in <xref ref-type="table" rid="table1">Table 1</xref>), an important cross-method comparison emerged: the naive students who used ChatGPT-4o achieved higher scores (mean 13.2, SD 3.3) than the learned students who used self-knowledge (mean 10.96, SD 2.5), e-books (mean 10.22, SD 3.12), or Google (mean 12.14, SD 2.01). This demonstrates that the advantage conferred by using ChatGPT-4o was sufficient to overcome the knowledge gap between the naive and learned students when the latter were restricted to conventional resources.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Box-violin plot showing the mean scores in the naive and learned groups.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v12i1e81264_fig02.png"/></fig></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>AI is changing the face of medical education, as it suggests some new solutions to the old forms of teaching, increases the educational experience, and improves the results of students [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. AI-based solutions, including LLMs, such as ChatGPT, virtual assistants, and AI-based simulation technologies, can change how medical students learn and apply their knowledge [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>].</p><p>This study found that learned students consistently outperformed naive students across all learning methods. However, the naive students who used ChatGPT-4o achieved higher scores than the learned students who used conventional resources (ie, self-knowledge, e-books, or Google), suggesting that AI-LLM tools may help bridge knowledge gaps more effectively than traditional learning resources.</p><p>Our study demonstrates that AI-powered LLMs such as ChatGPT can notably improve students&#x2019; performance on pharmacology MCQs, particularly for those without prior subject knowledge. Although our findings show that students achieved higher MCQ test scores when using ChatGPT-4o, we cannot conclude that this represents a genuine improvement in cognitive performance, critical thinking, or clinical decision-making skills. Higher scores may reflect the AI&#x2019;s ability to rapidly retrieve and present relevant information rather than deeper student understanding. The findings indicated that learned students have outperformed naive students in all 4 sets, and AI-LLM GPT recorded the best performance. The greatest effect size was observed in the AI group (partial &#x03B7;&#x00B2;=0.328), which indicates the tremendous influence of AI-LLM in ensuring the students improve their understanding and problem-solving skills. These results are consistent with those of previous research in that AI tools may enhance critical thinking and support learning under the condition that they are properly used by a student who already has a good knowledge grounding [<xref ref-type="bibr" rid="ref18">18</xref>].</p><p>As opposed to other methods, the e-books set exhibited the lowest performance. This can be explained by the fact that it takes a lot of time to navigate and search relevant information in the e-books. This reveals the difficulties of self-learning with the help of conventional digital sources, especially in the case of naive students who are probably not able to manage their time efficiently. In contrast, the self-knowledge set outperformed the e-books set, which means that dependence on inherent knowledge, although restricted to a certain extent, can be more helpful than the effective utilization of external means.</p><p>Although our quantitative data demonstrate that ChatGPT-4o enhanced student performance, particularly for naive learners, the mechanisms underlying this effectiveness warrant deeper exploration. There may be several reasons for AI-LLM GPT (ChatGPT-4o) to outperform other methods of assistance.</p><p>First, ChatGPT-4o provides immediate, targeted responses without requiring students to navigate complex search results or textbook indices. Informal feedback from participants suggested that students who used Google often struggled to identify authoritative sources among numerous search results, whereas those who used e-books spent considerable time locating relevant chapters. In contrast, ChatGPT-4o delivered direct answers to questions, reducing the cognitive load related to information seeking.</p><p>Second, ChatGPT-4o&#x2019;s conversational interface may facilitate iterative learning. Students could ask follow-up questions to clarify concepts, request examples, or seek a specific explanation for a specific MCQ&#x2014;a dynamic interaction not possible with static e-books and more efficient than reformulating multiple Google searches.</p><p>Third, the structured, synthesized format of ChatGPT-4o responses may be particularly beneficial for naive learners who lack the prior knowledge framework to evaluate and integrate fragmented information from multiple sources. ChatGPT-4o essentially predigests information, whereas Google and e-books require students to perform this synthesis themselves&#x2014;a task that may be especially challenging without foundational knowledge.</p><p>However, these remain as hypotheses. Future research should use mixed methods approaches, including think-aloud protocols during tool use, posttask interviews exploring student decision-making processes, and screen recordings analyzing search strategies and information evaluation patterns. Such qualitative data would provide richer insights into how students with different knowledge levels interact with various resources and why certain tools prove more effective. The study of recognizing the pattern of wrong responses in the AI-LLM GPTs output may also generate an &#x201C;array of errors&#x201D; for further training and improving LLMs.</p><p>These findings have substantial implications for both local and global medical education practices. In our institutional context, where students face high patient loads and limited access to senior clinicians for immediate consultation, AI-LLM GPTs could serve as readily available reference tools to support clinical decision-making during training. However, integration must be carefully structured to enhance rather than replace foundational learning.</p><p>Globally, these results are particularly relevant for resource-limited settings where access to comprehensive textbooks, updated references, and expert faculty may be constrained. AI-LLM GPTs could help democratize access to medical knowledge, potentially reducing disparities between well-resourced and under-resourced educational institutions. However, this assumes reliable internet connectivity and technological infrastructure, which remain barriers in many settings.</p><p>From a pedagogical perspective, our findings suggest a paradigm shift may be necessary in how we structure medical curricula. Rather than focusing exclusively on memorization of facts&#x2014;information that AI can rapidly retrieve&#x2014;educational programs should prioritize teaching students how to (1) formulate effective questions and search strategies, (2) critically evaluate AI-generated responses for accuracy and clinical appropriateness, (3) integrate AI-provided information with clinical context and patient-specific factors, and (4) develop metacognitive skills to recognize the limitations of both their own knowledge and AI tools.</p><p>Importantly, although AI-LLMs demonstrated effectiveness for MCQ performance, medical practice requires competencies beyond factual knowledge, including physical examination skills, procedural expertise, empathic patient communication, ethical reasoning under uncertainty, and team-based care coordination. Educational programs must ensure that AI integration enhances rather than diminishes these essential human dimensions of medical practice.</p><p>An important limitation is our focus on general-purpose ChatGPT-4o rather than specialized medical or pharmacology-specific AI agents. Domain-enriched LLMs that integrate pharmacology textbooks or medical databases may demonstrate different performance characteristics and potentially offer more accurate, context-specific responses. However, our choice reflects the current reality that most students have access to general LLMs such as ChatGPT-4o rather than specialized medical AI tools and makes the study more generalizable than using domain-enhanced LLMs. Second, the cross-sectional, single-day design prevents assessment of long-term learning outcomes, knowledge retention, or the development of clinical reasoning skills. Similarly, the sequential exposure to different resources (sets A through D) may have introduced order effects or learning transfer between sets. To minimize the learning transfer, the questions have been chosen from diverse topics and moderated to remove any repetition. However, the order effect cannot be removed completely in these types of cross-sectional&#x2013;sequential studies.</p><p>AI will be able to deliver personalized learning and adjust to the needs of students. This individualization helps the learners make their progress through their priorities, repeating difficult concepts or working through material as they become familiar with each subject [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. The AI-powered platforms can monitor student performance in real-time and can track the areas where the students might need more education or practice [<xref ref-type="bibr" rid="ref21">21</xref>]. Such benefits help achieve the speed and the depth of knowledge acquisition with a higher level of efficiency and more targeted learning [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>].</p></sec><sec id="s4-2"><title>Conclusions</title><p>To conclude, this study shows that the learned group outperformed the naive group in all sets, including AI-LLM GPT, internet search engine, e-books, and self-knowledge in problem solving. Ironically, the AI-LLM GPT naive group outperformed the problem-solving skills of even the learned group augmented with an internet search engine, showcasing the disruptive potential of AI-LLM in medical education. Further longitudinal studies examining knowledge retention, clinical reasoning development, and the ability to solve novel problems without AI assistance are needed to determine whether AI tools genuinely enhance cognitive capabilities or primarily serve as effective reference tools.</p></sec></sec></body><back><ack><p>The authors would like to express their gratitude to all the students who took part in this research. They would also like to thank Dr Binola for their constant motivation throughout the study. All authors declared that they had insufficient funding to support open access publication of this manuscript, including from affiliated organizations or institutions, funding agencies, or other organizations. JMIR Publications provided article processing fee (APF) support for the publication of this paper.</p></ack><notes><sec><title>Data Availability</title><p>The anonymized datasets generated and analyzed during this study are not publicly available due to institutional restrictions and the need to protect participant confidentiality; however, the data are available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">ANCOVA</term><def><p>analysis of covariance</p></def></def-item><def-item><term id="abb3">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb4">MCQ</term><def><p>multiple-choice question</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arawi</surname><given-names>T</given-names> </name><name name-style="western"><surname>El Bachour</surname><given-names>J</given-names> </name><name name-style="western"><surname>El Khansa</surname><given-names>T</given-names> </name></person-group><article-title>The fourth industrial revolution: its impact on artificial intelligence and medicine in developing countries</article-title><source>Asian Bioeth Rev</source><year>2024</year><month>05</month><day>25</day><volume>16</volume><issue>3</issue><fpage>513</fpage><lpage>526</lpage><pub-id pub-id-type="doi">10.1007/s41649-024-00284-7</pub-id><pub-id pub-id-type="medline">39022373</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sharma</surname><given-names>S</given-names> </name></person-group><article-title>Benefits or concerns of AI: a multistakeholder responsibility</article-title><source>Futures</source><year>2024</year><month>03</month><volume>157</volume><fpage>103328</fpage><pub-id pub-id-type="doi">10.1016/j.futures.2024.103328</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chaudhry</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Kazim</surname><given-names>E</given-names> </name></person-group><article-title>Artificial Intelligence in Education (AIEd): a high-level academic and industry note 2021</article-title><source>AI Ethics</source><year>2022</year><volume>2</volume><issue>1</issue><fpage>157</fpage><lpage>165</lpage><pub-id pub-id-type="doi">10.1007/s43681-021-00074-z</pub-id><pub-id pub-id-type="medline">34790953</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>LD</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>L</given-names> </name></person-group><article-title>Embedding blockchain technology into IoT for security: a survey</article-title><source>IEEE Internet Things J</source><year>2021</year><month>07</month><day>1</day><volume>8</volume><issue>13</issue><fpage>10452</fpage><lpage>10473</lpage><pub-id pub-id-type="doi">10.1109/JIOT.2021.3060508</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>Supriyono</collab><name name-style="western"><surname>Wibawa</surname><given-names>AP</given-names> </name><collab>Suyono</collab><name name-style="western"><surname>Kurniawan</surname><given-names>F</given-names> </name></person-group><article-title>Advancements in natural language processing: implications, challenges, and future directions</article-title><source>Telemat Inform Rep</source><year>2024</year><month>12</month><volume>16</volume><fpage>100173</fpage><pub-id pub-id-type="doi">10.1016/j.teler.2024.100173</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Popenici</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Kerr</surname><given-names>S</given-names> </name></person-group><article-title>Exploring the impact of artificial intelligence on teaching and learning in higher education</article-title><source>Res Pract Technol Enhanc Learn</source><year>2017</year><volume>12</volume><issue>1</issue><fpage>22</fpage><pub-id pub-id-type="doi">10.1186/s41039-017-0062-8</pub-id><pub-id pub-id-type="medline">30595727</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ghory</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ghafory</surname><given-names>H</given-names> </name></person-group><article-title>The impact of modern technology in the teaching and learning process</article-title><source>Int J Innov Res Sci Stud</source><year>2021</year><month>06</month><day>18</day><volume>4</volume><issue>3</issue><fpage>219</fpage><lpage>227</lpage><pub-id pub-id-type="doi">10.53894/ijirss.v4i3.73</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Buja</surname><given-names>LM</given-names> </name></person-group><article-title>Medical education today: all that glitters is not gold</article-title><source>BMC Med Educ</source><year>2019</year><month>04</month><day>16</day><volume>19</volume><issue>1</issue><fpage>110</fpage><pub-id pub-id-type="doi">10.1186/s12909-019-1535-9</pub-id><pub-id pub-id-type="medline">30991988</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Salih</surname><given-names>S</given-names> </name><name name-style="western"><surname>Husain</surname><given-names>O</given-names> </name><name name-style="western"><surname>Hamdan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Abdelsalam</surname><given-names>S</given-names> </name><name name-style="western"><surname>Elshafie</surname><given-names>H</given-names> </name><name name-style="western"><surname>Motwakel</surname><given-names>A</given-names> </name></person-group><article-title>Transforming education with AI: a systematic review of ChatGPT&#x2019;s role in learning, academic practices, and institutional adoption</article-title><source>Res Eng</source><year>2025</year><month>03</month><volume>25</volume><fpage>103837</fpage><pub-id pub-id-type="doi">10.1016/j.rineng.2024.103837</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lawasi</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Rohman</surname><given-names>VA</given-names> </name><name name-style="western"><surname>Shoreamanis</surname><given-names>M</given-names> </name></person-group><article-title>The use of AI in improving student&#x2019;s critical thinking skills</article-title><source>Proc Ser Soc Sci Humanit</source><year>2024</year><month>09</month><volume>18</volume><fpage>366</fpage><lpage>370</lpage><pub-id pub-id-type="doi">10.30595/pssh.v18i.1279</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Martindale</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bizzaco</surname><given-names>M</given-names> </name></person-group><article-title>GPT-4 vs GPT-35: how much difference is there?</article-title><source>Digital Trends</source><year>2023</year><month>04</month><day>4</day><access-date>2023-07-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.digitaltrends.com/computing/gpt-4-vs-gpt-35">https://www.digitaltrends.com/computing/gpt-4-vs-gpt-35</ext-link></comment></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Deutscher</surname><given-names>M</given-names> </name></person-group><article-title>Microsoft researchers reveal neural network with 135B parameters</article-title><source>SiliconANGLE</source><year>2021</year><month>08</month><day>4</day><access-date>2023-07-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://siliconangle.com/2021/08/04/microsoft-researchers-reveal-neural-network-135b-parameters">https://siliconangle.com/2021/08/04/microsoft-researchers-reveal-neural-network-135b-parameters</ext-link></comment></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Almekinders</surname><given-names>S</given-names> </name></person-group><article-title>Google Bard PaLM update: 540 billion parameters take fight to ChatGPT</article-title><source>Techzine</source><year>2023</year><month>04</month><day>3</day><access-date>2025-12-05</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.techzine.eu/news/applications/104043/google-bard-palm-update-540-billion-parameters-take-fight-to-chatgpt/">https://www.techzine.eu/news/applications/104043/google-bard-palm-update-540-billion-parameters-take-fight-to-chatgpt/</ext-link></comment></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mir</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Mir</surname><given-names>GM</given-names> </name><name name-style="western"><surname>Raina</surname><given-names>NT</given-names> </name><etal/></person-group><article-title>Application of artificial intelligence in medical education: current scenario and future perspectives</article-title><source>J Adv Med Educ Prof</source><year>2023</year><month>07</month><volume>11</volume><issue>3</issue><fpage>133</fpage><lpage>140</lpage><pub-id pub-id-type="doi">10.30476/JAMP.2023.98655.1803</pub-id><pub-id pub-id-type="medline">37469385</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nagi</surname><given-names>F</given-names> </name><name name-style="western"><surname>Salih</surname><given-names>R</given-names> </name><name name-style="western"><surname>Alzubaidi</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Applications of artificial intelligence (AI) in medical education: a scoping review</article-title><source>Stud Health Technol Inform</source><year>2023</year><month>06</month><day>29</day><volume>305</volume><fpage>648</fpage><lpage>651</lpage><pub-id pub-id-type="doi">10.3233/SHTI230581</pub-id><pub-id pub-id-type="medline">37387115</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mattas</surname><given-names>PS</given-names> </name></person-group><article-title>ChatGPT: a study of AI language processing and its implications</article-title><source>Int J Res Publ Rev</source><year>2023</year><volume>04</volume><issue>2</issue><fpage>435</fpage><lpage>440</lpage><pub-id pub-id-type="doi">10.55248/gengpi.2023.4218</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alawida</surname><given-names>M</given-names> </name><name name-style="western"><surname>Mejri</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mehmood</surname><given-names>A</given-names> </name><name name-style="western"><surname>Chikhaoui</surname><given-names>B</given-names> </name><name name-style="western"><surname>Isaac Abiodun</surname><given-names>O</given-names> </name></person-group><article-title>A comprehensive study of ChatGPT: advancements, limitations, and ethical considerations in natural language processing and cybersecurity</article-title><source>Information</source><year>2023</year><volume>14</volume><issue>8</issue><fpage>462</fpage><pub-id pub-id-type="doi">10.3390/info14080462</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lijie</surname><given-names>H</given-names> </name><name name-style="western"><surname>Mat Yusoff</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mohamad Marzaini</surname><given-names>AF</given-names> </name></person-group><article-title>Influence of AI-driven educational tools on critical thinking dispositions among university students in Malaysia: a study of key factors and correlations</article-title><source>Educ Inf Technol</source><year>2025</year><volume>30</volume><fpage>8029</fpage><lpage>8053</lpage><pub-id pub-id-type="doi">10.1007/s10639-024-13150-8</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Narayanan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ramakrishnan</surname><given-names>R</given-names> </name><name name-style="western"><surname>Durairaj</surname><given-names>E</given-names> </name><name name-style="western"><surname>Das</surname><given-names>A</given-names> </name></person-group><article-title>Artificial intelligence revolutionizing the field of medical education</article-title><source>Cureus</source><year>2023</year><month>11</month><day>28</day><volume>15</volume><issue>11</issue><fpage>e49604</fpage><pub-id pub-id-type="doi">10.7759/cureus.49604</pub-id><pub-id pub-id-type="medline">38161821</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jong</surname><given-names>M</given-names> </name></person-group><article-title>Transforming medical education in the AI era: balancing technological expertise with humanistic care in tomorrow&#x2019;s doctors</article-title><source>Ann Acad Med Singap</source><year>2024</year><month>12</month><day>12</day><volume>53</volume><issue>12</issue><fpage>754</fpage><lpage>757</lpage><pub-id pub-id-type="doi">10.47102/annals-acadmedsg.2024242</pub-id><pub-id pub-id-type="medline">39748174</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gligorea</surname><given-names>I</given-names> </name><name name-style="western"><surname>Cioca</surname><given-names>M</given-names> </name><name name-style="western"><surname>Oancea</surname><given-names>R</given-names> </name><name name-style="western"><surname>Gorski</surname><given-names>AT</given-names> </name><name name-style="western"><surname>Gorski</surname><given-names>H</given-names> </name><name name-style="western"><surname>Tudorache</surname><given-names>P</given-names> </name></person-group><article-title>Adaptive learning using artificial intelligence in e-learning: a literature review</article-title><source>Educ Sci</source><year>2023</year><volume>13</volume><issue>12</issue><fpage>1216</fpage><pub-id pub-id-type="doi">10.3390/educsci13121216</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ahn</surname><given-names>HY</given-names> </name></person-group><article-title>AI-powered e-learning for lifelong learners: impact on performance and knowledge application</article-title><source>Sustainability</source><year>2024</year><volume>16</volume><issue>20</issue><fpage>9066</fpage><pub-id pub-id-type="doi">10.3390/su16209066</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alqahtani</surname><given-names>T</given-names> </name><name name-style="western"><surname>Badreldin</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Alrashed</surname><given-names>M</given-names> </name><etal/></person-group><article-title>The emergent role of artificial intelligence, natural learning processing, and large language models in higher education and research</article-title><source>Res Social Adm Pharm</source><year>2023</year><month>08</month><volume>19</volume><issue>8</issue><fpage>1236</fpage><lpage>1242</lpage><pub-id pub-id-type="doi">10.1016/j.sapharm.2023.05.016</pub-id><pub-id pub-id-type="medline">37321925</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Post hoc results of the naive and learned groups.</p><media xlink:href="mededu_v12i1e81264_app1.docx" xlink:title="DOCX File, 6001 KB"/></supplementary-material></app-group></back></article>