<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JME</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Educ</journal-id>
      <journal-title>JMIR Medical Education</journal-title>
      <issn pub-type="epub">2369-3762</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v11i1e85614</article-id>
      <article-id pub-id-type="pmid">41468580</article-id>
      <article-id pub-id-type="doi">10.2196/85614</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Evaluation of Few-Shot AI-Generated Feedback on Case Reports in Physical Therapy Education: Mixed Methods Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Chartash</surname>
            <given-names>David</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>El-Sobkey</surname>
            <given-names>Salwa</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ekwueme</surname>
            <given-names>Moses</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Sudo</surname>
            <given-names>Hisaya</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution/>
            <institution>The United Graduate School of Education</institution>
            <institution>Tokyo Gakugei University</institution>
            <addr-line>4-1-1 Nukuikita-machi</addr-line>
            <addr-line>Koganei-shi</addr-line>
            <addr-line>Tokyo, 184-8501</addr-line>
            <country>Japan</country>
            <phone>81 42 329 7111</phone>
            <email>hisaya.sudo@takalab.jp</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0000-4979-0371</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Noborimoto</surname>
            <given-names>Yoko</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5917-3692</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Takahashi</surname>
            <given-names>Jun</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-0488-5485</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>The United Graduate School of Education</institution>
        <institution>Tokyo Gakugei University</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Graduate School of Teacher Education</institution>
        <institution>Tokyo Gakugei University</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Faculty of Education</institution>
        <institution>Tokyo Gakugei University</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Hisaya Sudo <email>hisaya.sudo@takalab.jp</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>30</day>
        <month>12</month>
        <year>2025</year>
      </pub-date>
      <volume>11</volume>
      <elocation-id>e85614</elocation-id>
      <history>
        <date date-type="received">
          <day>10</day>
          <month>10</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>5</day>
          <month>11</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>25</day>
          <month>11</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>18</day>
          <month>12</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Hisaya Sudo, Yoko Noborimoto, Jun Takahashi. Originally published in JMIR Medical Education (https://mededu.jmir.org), 30.12.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Education, is properly cited. The complete bibliographic information, a link to the original publication on https://mededu.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://mededu.jmir.org/2025/1/e85614" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>While artificial intelligence (AI)–generated feedback offers significant potential to overcome constraints on faculty time and resources associated with providing personalized feedback, its perceived usefulness can be undermined by algorithm aversion. In-context learning, particularly the few-shot approach, has emerged as a promising paradigm for enhancing AI performance. However, there is limited research investigating its usefulness, especially in health profession education.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to compare the quality of AI-generated formative feedback from 2 settings, feedback generated in a zero-shot setting (hereafter, “zero-shot feedback”) and feedback generated in a few-shot setting (hereafter, “few-shot feedback”), using a mixed methods approach in Japanese physical therapy education. Additionally, we examined the effect of algorithm aversion on these 2 feedback types.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>A mixed methods study was conducted with 35 fourth-year physical therapy students (mean age 21.4, SD 0.7 years). Zero-shot feedback was created using Gemini 2.5 Pro with default settings, whereas few-shot feedback was generated by providing the same model with 9 teacher-created examples. The participants compared the quality of both feedback types using 3 methods: a direct preference question, the Feedback Perceptions Questionnaire (FPQ), and focus group interviews. Quantitative comparisons of FPQ scores were performed using the Wilcoxon signed rank test. To investigate algorithm aversion, the study examined how student perceptions changed before and after disclosure of the feedback’s identity.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Most students (26/35, 74%) preferred few-shot feedback over zero-shot feedback in terms of overall usefulness, although no significant difference was found between the 2 feedback types for the total FPQ score (<italic>P</italic>=.22). On the specific FPQ scales, few-shot feedback scored significantly higher than zero-shot feedback on fairness across all 3 items: “satisfied” (<italic>P</italic>=.02; <italic>r</italic>=0.407), “fair” (<italic>P</italic>=.04; <italic>r</italic>=0.341), and “justified” (<italic>P</italic>=.02; <italic>r</italic>=0.392). It also scored significantly higher on 1 item of the usefulness scale (“useful”; <italic>P</italic>=.02; <italic>r</italic>=0.401) and 1 item of the willingness scale (“invest a lot of effort”; <italic>P</italic>=.02; <italic>r</italic>=0.394). In contrast, zero-shot feedback scored significantly higher on the affect scale across 2 items: “successful” (<italic>P</italic>=.03; <italic>r</italic>=0.365) and “angry” (<italic>P</italic>=.008; <italic>r</italic>=0.443). Regarding algorithm aversion, evaluations for zero-shot feedback became more negative for 83% (15/18) of the items after identity disclosure, whereas positive perceptions of few-shot feedback were maintained or increased. Qualitative analysis revealed that students valued zero-shot feedback for its encouraging tone, whereas few-shot feedback was appreciated for its contextual understanding and concrete guidance for improvement.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Japanese physical therapy students perceived few-shot feedback more favorably than zero-shot feedback on case reports. This few-shot AI model shows potential to resist algorithm aversion and serves as an effective educational tool to support autonomous writing, facilitate reflection on clinical reasoning, and cultivate advanced thinking skills.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>large language models</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>AI</kwd>
        <kwd>generative artificial intelligence</kwd>
        <kwd>generative AI</kwd>
        <kwd>Gemini</kwd>
        <kwd>in-context learning</kwd>
        <kwd>few-shot setting</kwd>
        <kwd>formative feedback</kwd>
        <kwd>algorithm aversion</kwd>
        <kwd>health profession education</kwd>
        <kwd>physical therapy education</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The integration of generative artificial intelligence (AI) into the health care sector has garnered much attention in recent years, with ongoing debates about its potential and limitations [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. These rapid advancements require a fundamental transformation of various aspects of education, such as learning goals, teachers’ roles, curriculum development, and learner assessment [<xref ref-type="bibr" rid="ref9">9</xref>]. Health profession education is no exception to this trend [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        <p>A promising application of this transformative technology is AI-powered formative assessment for case reports, which demonstrates great potential for developing students’ clinical reasoning skills by providing adaptive, real-time, and personalized feedback. Clinical reasoning refers to the essential higher-order cognitive process that clinicians use to reach the right diagnosis and recommend the appropriate therapy [<xref ref-type="bibr" rid="ref10">10</xref>]. Traditionally, these clinical reasoning skills have been cultivated through the iterative process of discussing real cases, writing case reports, and refining them with feedback from experienced clinicians [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref12">12</xref>]. However, this traditional model faces significant logistical challenges in formal educational settings. For example, providing personalized feedback to each student in an academically diverse cohort is highly demanding on faculty time and resources, making it difficult to implement the frequent cycles of feedback and revision necessary for skill development. The use of AI technology holds significant potential for overcoming these challenges. Although a growing body of research has investigated the effectiveness of AI-powered feedback [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref16">16</xref>], few studies have focused specifically on health profession education.</p>
      </sec>
      <sec>
        <title>Related Work</title>
        <p>Formative feedback is information that modifies a learner’s thinking or behavior to improve performance [<xref ref-type="bibr" rid="ref17">17</xref>]. Recent research has explored the effectiveness of formative feedback generated by large language models (LLMs), such as ChatGPT developed by OpenAI, for enhancing students’ writing skills [<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref23">23</xref>]. Specifically, a study by Shi et al [<xref ref-type="bibr" rid="ref20">20</xref>] found that students receiving feedback from ChatGPT showed significantly higher academic writing performance compared to a control group. Indeed, the overall quality of feedback generated by LLMs has been found to be comparable to that of human experts across several criteria, including linguistic clarity and the use of technical terminology [<xref ref-type="bibr" rid="ref21">21</xref>]. However, the findings are not uniform. For instance, another study has revealed that peer-generated feedback outperformed that from ChatGPT [<xref ref-type="bibr" rid="ref22">22</xref>]. Moreover, Escalante et al [<xref ref-type="bibr" rid="ref23">23</xref>] found that, while there was no significant difference in learning outcomes between ChatGPT and human tutor feedback, each offered distinct advantages. These varied findings suggest that research in this domain is still in its early stages and the debate is ongoing. Consequently, the emerging consensus points toward a hybrid approach that combines the respective strengths of human- and AI-generated feedback rather than debating which is superior [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref24">24</xref>].</p>
        <p>Although LLMs possess extensive general knowledge, they often lack depth in specialized fields such as medicine, finance, and law. This limitation often leads to significant inaccuracies and hallucinations when the models are asked questions that require specialized information. Dynamically injecting domain-specific knowledge in real time represents a promising solution to enhance their accuracy and reliability for these specialized tasks [<xref ref-type="bibr" rid="ref25">25</xref>]. As a viable approach to this challenge, in-context learning has become a significant new paradigm. This approach allows LLMs to make predictions by leveraging a few examples provided within the context [<xref ref-type="bibr" rid="ref26">26</xref>]. In the in-context learning framework, Brown et al [<xref ref-type="bibr" rid="ref27">27</xref>] contrasted the zero-shot setting, which relies solely on simple natural language prompts describing the task, with one-shot and few-shot settings, which provide one or several reference examples to help the model understand domain-specific context. Their findings demonstrated that providing just one or a few examples (one-shot and few-shot approaches) resulted in significantly higher performance than the zero-shot approach. A recent study by Rüdian et al [<xref ref-type="bibr" rid="ref28">28</xref>] evaluated student perceptions of LLM-generated feedback using this few-shot setting in language education. Their approach leveraged 10 pairs of existing student submissions and their corresponding teacher comments to effectively prime the LLM. This priming was further guided by the following prompt: “You are a helpful teacher who provides feedback based on the texts submitted by students. Respond from the first-person perspective.” The results showed that students reported that they could not distinguish LLM-generated feedback with the few-shot setting from feedback created by teachers. This field is still emerging, and further research is required. In particular, there is limited research comparing the quality of formative feedback generated via zero-shot versus few-shot settings. This comparison will provide crucial foundational insights for designing more effective domain-specific AI-generated feedback in education.</p>
        <p>For successful integration of LLM-based feedback systems into educational settings, identifying their usefulness and student acceptance is crucial [<xref ref-type="bibr" rid="ref28">28</xref>]. A key phenomenon in evaluating the usefulness of AI-generated feedback is “algorithm aversion” [<xref ref-type="bibr" rid="ref29">29</xref>], which refers to the tendency to prefer human advice over that of AI even when the AI’s advice is superior. To investigate the impact of algorithm aversion on AI-generated feedback, Nazaretsky et al [<xref ref-type="bibr" rid="ref30">30</xref>] examined how students’ perceptions of AI- and human-generated feedback changed before and after revealing the feedback provider’s identity. The results showed that students’ evaluations of the AI-generated feedback became significantly more negative after they were informed of its identity. A promising approach to address algorithm aversion involves integrating human educators’ input into AI-based systems. For example, a study by Zhang et al [<xref ref-type="bibr" rid="ref31">31</xref>] demonstrated that revealing the source of AI-generated feedback negatively impacted students’ perception of its genuineness, whereas the evaluation of human and AI–coproduced feedback was unaffected by the disclosure of its identity. Our human-AI hybrid methodology differs from the human and AI–coproduced approach described by Zhang et al [<xref ref-type="bibr" rid="ref31">31</xref>], in which LLMs provide suggestions only when they determine that the teacher-created feedback requires improvement. Given that final human verification of LLM outputs is essential, enhancing the AI’s output itself has the advantages of generating higher-quality feedback and reducing the burden of human review. Therefore, this study contributes to this area by examining whether AI-generated feedback from a few-shot setting demonstrates resistance to algorithm aversion.</p>
        <p>To assess the quality of AI-generated feedback on case reports, this study used the Feedback Perceptions Questionnaire (FPQ) [<xref ref-type="bibr" rid="ref32">32</xref>]. The FPQ is a multidimensional 18-item instrument (shown in <xref ref-type="table" rid="table1">Table 1</xref>) designed to measure feedback perceptions across 5 scales: fairness, usefulness, acceptance, willingness, and affect. Items were measured on a 100-mm visual analogue scale from “fully disagree” (0) to “fully agree” (100). The 3 items for negative affect (items 16-18) are reverse coded, meaning that a higher score indicates a lower level of that emotion. For example, for the negative affect item “I would feel angry if I received this feedback on my revision,” a check mark for 30 points (indicating low anger) would be reverse coded and calculated as 70 points (100 – 30 = 70) toward the overall affect score. The FPQ is a structurally valid and reliable instrument widely used in higher education research to compare perceptions of different types of feedback [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref35">35</xref>].</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Items of the Feedback Perceptions Questionnaire [<xref ref-type="bibr" rid="ref32">32</xref>].</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="140"/>
            <col width="0"/>
            <col width="830"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Subscale</td>
                <td>Items</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Fairness</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Item 1: “I would be satisfied with this feedback.”</p>
                    </list-item>
                    <list-item>
                      <p>Item 2: “I would consider this feedback fair.”</p>
                    </list-item>
                    <list-item>
                      <p>Item 3: “I would consider this feedback justified.”</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">Usefulness</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Item 4: “I would consider this feedback useful.”</p>
                    </list-item>
                    <list-item>
                      <p>Item 5: “I would consider this feedback helpful.”</p>
                    </list-item>
                    <list-item>
                      <p>Item 6: “This feedback would provide me a lot of support.”</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">Acceptance</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Item 7: “I would accept this feedback.”</p>
                    </list-item>
                    <list-item>
                      <p>Item 8: “I would dispute this feedback.”</p>
                    </list-item>
                    <list-item>
                      <p>Item 9: “I would reject this feedback.”</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">Willingness</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Item 10: “I would be willing to improve my performance.”</p>
                    </list-item>
                    <list-item>
                      <p>Item 11: “I would be willing to invest a lot of effort in my revision.”</p>
                    </list-item>
                    <list-item>
                      <p>Item 12: “I would be willing to work on further text revision assignments.”</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="4">Affect: “I would feel...if I received this feedback on my revision.”</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Positive</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Item 13: satisfied</p>
                    </list-item>
                    <list-item>
                      <p>Item 14: confident</p>
                    </list-item>
                    <list-item>
                      <p>Item 15: successful</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Negative</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Item 16: offended</p>
                    </list-item>
                    <list-item>
                      <p>Item 17: angry</p>
                    </list-item>
                    <list-item>
                      <p>Item 18: frustrated</p>
                    </list-item>
                  </list>
                </td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Research Objectives</title>
        <p>This study aimed to compare the quality of AI-generated formative feedback from 2 different settings, feedback generated in a zero-shot setting (hereafter, “zero-shot feedback”) and feedback generated in a few-shot setting (hereafter, “few-shot feedback”), using a mixed methods approach in Japanese physical therapy education. To examine the effect of algorithm aversion on these 2 feedback types, this study investigated the following research questions: How do physical therapy students evaluate zero-shot and few-shot feedback? How do their evaluations change before and after revealing the identity of the feedback?</p>
        <p>The findings offer practical guidelines for the effective integration of generative AI into health profession education.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Participants</title>
        <p>An a priori power analysis was conducted using G*Power (version 3.1.9.7) to determine the required sample size for a Wilcoxon signed rank test. The minimum required sample size was calculated to be 74 based on an assumed effect size of 0.3, an α level of .05, and statistical power of 0.80.</p>
        <p>A total of 40 fourth-year students from a 4-year physical therapy college in Japan were invited to participate in the study. Of these 40 students, 35 (88%) provided informed consent and were included in the final sample (n=22, 63% male and n=13, 37% female; mean age 21.4, SD 0.7 years). Their mean third-year grade point average was 2.8 (SD 0.5) on a 4-point scale. The final sample size did not reach the 74 estimated by the power analysis. This limitation was due to the exploratory nature of this study, which recruited from a single cohort at a single institution. Consequently, the findings should be interpreted with caution as the reduced statistical power increases the risk of type II error.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>All procedures performed in this study were in accordance with the ethical standards of the Declaration of Helsinki. Written informed consent was obtained from all participants, and a comprehensive verbal and written explanation of the study’s content was provided. This study was approved by the Research Ethics Committee of Tokyo Gakugei University (approval 1022). Participation was voluntary, and no incentives were provided. To protect participant privacy and confidentiality, all data were anonymized, and identifying details were omitted from the analysis and report.</p>
      </sec>
      <sec>
        <title>Procedure</title>
        <p>We administered a survey on the use of generative AI tools. This survey included items on (1) past experience with LLMs; (2) the LLM tool they used most frequently; and (3) the frequency of LLM use for 5 specific tasks: academic writing, gathering information, translating, generating new ideas, and proofreading, which were adapted from a large-scale global survey [<xref ref-type="bibr" rid="ref36">36</xref>]. This frequency was measured on a 5-point Likert scale (1=“never”; 5=“always”).</p>
        <p>This study, conducted in July 2025, used a mixed methods approach to compare the quality of zero-shot and few-shot feedback from the perspective of Japanese physical therapy students. This study involved a quantitative evaluation using a questionnaire and a qualitative analysis of semistructured focus group interviews.</p>
        <p>The procedure for this study consisted of 4 main phases. First, the 2 types of feedback were generated. Zero-shot feedback was created in the web-based interface of Gemini 2.5 Pro (Google) with the platform’s default settings (eg, default temperature) and without any manual parameter adjustments. Few-shot feedback was created using the same model and default settings by providing Gemini 2.5 Pro with 9 examples of prior feedback comments as reference text. These reference comments were written by the first author (16 years of experience as a physical therapist and 5 years of experience as a physical therapy teacher) in May 2025. The comments were for different case reports written by different students. The exact user prompts used to create zero-shot and few-shot feedback, along with an example of prior teacher-created feedback, are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Examples of zero-shot and few-shot feedback on a case report are provided in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>. No postprocessing or editing was performed on these 2 outputs.</p>
        <p>Second, in a blinded evaluation, participants assessed each type of feedback using the FPQ. After completing the FPQ, participants were asked to indicate which feedback type they perceived as more useful overall.</p>
        <p>Third, the identity of each feedback type was disclosed to the participants. Participants then re-evaluated their initial FPQ responses, revising only the items they wished to change.</p>
        <p>Finally, semistructured focus group interviews were conducted with 26% (9/35) of the participants (3 male and 6 female). They were divided into 3 focus groups of 3 students each, and each group interview lasted approximately 20 minutes. The interviews explored the rationale behind their perceptions of each feedback type. The interviewees were purposively selected to ensure a mix of students who had received relatively high and low faculty evaluations on their prior case reports.</p>
      </sec>
      <sec>
        <title>Data Analysis</title>
        <p>For the quantitative data, descriptive statistics were used to analyze the responses to the direct preference question: “Overall, which feedback comment do you feel is more useful?” The Wilcoxon signed rank test was then used to compare students’ evaluations of zero-shot and few-shot feedback on the median total score on the FPQ and the median scores for each individual FPQ item. Additionally, to address the risk of familywise error from multiple comparisons across the 18 individual FPQ items, adjusted <italic>P</italic> values were calculated using the Bonferroni correction. Following the disclosure of the feedback identity, the number of students whose evaluation became more positive or more negative for each FPQ item was counted. All statistical analyses were performed using Stata/BE (version 19.0; StataCorp LLC), with a significance level set at <italic>P</italic>&#60;.05.</p>
        <p>The interviews were audio recorded and transcribed verbatim, with the transcripts serving as the data for analysis. The qualitative analysis followed four main steps: (1) relevant utterances were extracted as meaningful units; (2) each unit was assigned a code; (3) similar codes were inductively grouped into subcategories; and (4) guided by the study’s objective to clarify the characteristics of each feedback type, these subcategories were then organized and integrated into predetermined categories. This analytical process was not strictly linear but recursive, involving movement back and forth between these steps to refine the codes, categories, and themes, consistent with the principles of thematic analysis [<xref ref-type="bibr" rid="ref37">37</xref>].</p>
        <p>We maintained a rigorous audit trail using Google Sheets. The platform’s version history, combined with analytical memos recorded in the document, provided a transparent record of our iterative coding and thematic development process. To ensure the validity of this qualitative analysis, the final codes and categories were determined through discussion and consensus among the 3 authors. Moreover, to verify coding reliability, an external coder (an experienced physical therapy teacher) independently classified 50% (21/42) of the codes into the categories defined by the authors. Interrater reliability was assessed using the Cohen κ. The κ coefficient was 0.504 (95% CI 0.351-0.656), indicating a statistically significant, moderate agreement beyond chance (<italic>Z</italic>=6.47; <italic>P</italic>&#60;.001).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>All participants reported having prior experience with LLMs. Regarding the most frequently used tool, a clear majority of students reported using ChatGPT (32/35, 91%), followed by Gemini (2/35, 6%) and Microsoft Copilot (1/35, 3%). <xref rid="figure1" ref-type="fig">Figure 1</xref> shows the results for the frequency of LLM use for the 5 specific tasks.</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Frequency of large language model use for specific tasks (N=35; 1=“never”; 5=“always”).</p>
        </caption>
        <graphic xlink:href="mededu_v11i1e85614_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p><xref rid="figure2" ref-type="fig">Figure 2</xref> shows the box-and-whisker plot comparing student perceptions of zero-shot and few-shot feedback across all 18 FPQ items. Detailed statistical results of the FPQ scores are provided in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Box-and-whisker plot comparing student perceptions of zero-shot and few-shot feedback across all 18 Feedback Perceptions Questionnaire (FPQ) items. Q: item.</p>
        </caption>
        <graphic xlink:href="mededu_v11i1e85614_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>The Cronbach α coefficients indicated acceptable to excellent internal consistency for most scales (Cronbach α≥0.71), with the exception of the acceptance scale for few-shot feedback (Cronbach α=0.58). To further examine the low reliability of this specific scale, additional reliability analyses were conducted for few-shot feedback to examine whether removing an item would improve internal consistency. These analyses indicated that omitting item 8 (retaining items 7 and 9; Cronbach α=0.56), item 9 (retaining items 7 and 8; Cronbach α=0.59), or item 7 (retaining items 8 and 9; Cronbach α=0.31) did not meaningfully increase the reliability beyond the original 3-item scale (Cronbach α=0.58). Therefore, all 3 items were retained, with the understanding that findings related to the acceptance scale must be interpreted with caution.</p>
      <p>Regarding the overall usefulness preference, a clear majority of students (26/35, 74%) selected few-shot feedback as more useful than zero-shot feedback, although no significant difference was found between the 2 feedback types for the total FPQ score (<italic>P</italic>=.22).</p>
      <p>The Wilcoxon signed rank test revealed several statistically significant differences before correction for multiple comparisons. On the specific FPQ scales, few-shot feedback scored significantly higher than zero-shot feedback on fairness across all 3 items: “satisfied” (<italic>P</italic>=.02; <italic>r</italic>=0.407), “fair” (<italic>P</italic>=.04; <italic>r</italic>=0.341), and “justified” (<italic>P</italic>=.02; <italic>r</italic>=0.392). Few-shot feedback also scored significantly higher on 1 item of the usefulness scale (“useful”; <italic>P</italic>=.02; <italic>r</italic>=0.401) and 1 item of the willingness scale (“invest a lot of effort”; <italic>P</italic>=.02; <italic>r</italic>=0.394). In contrast, for the affect scale, zero-shot feedback elicited significantly more positive emotions and fewer negative emotions. Specifically, students reported feeling significantly more “successful” (<italic>P</italic>=.03; <italic>r</italic>=0.365) and significantly less “angry” (<italic>P</italic>=.008; <italic>r</italic>=0.443) with zero-shot feedback compared to few-shot feedback. However, after applying the Bonferroni correction to address the risk of familywise error from multiple comparisons across the 18 items, none of these differences remained statistically significant (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> provides detailed adjusted <italic>P</italic> values).</p>
      <p><xref rid="figure3" ref-type="fig">Figure 3</xref> illustrates the number of students whose evaluations for each of the 18 FPQ items changed after the feedback identities were revealed. Detailed data on the direction of changes in FPQ scores for each item are provided in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. As this analysis focused on the direction of change (ie, positive or negative) rather than its magnitude, the following description compares the direction in which impressions shifted for each item. After the reveal, evaluations of zero-shot feedback tended to become more negative. For 83% (15/18) of the items, more students lowered their rating for zero-shot feedback than for few-shot feedback. In contrast, evaluations of few-shot feedback tended to become more positive. For all 18 items, a greater number of students increased their rating for few-shot feedback compared to zero-shot feedback. The proportion of students whose evaluations remained completely unchanged was 54% (19/35) for zero-shot feedback and 57% (20/35) for few-shot feedback.</p>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>Comparison of the number of students with increased (“up”) or decreased (“down”) evaluation scores for zero-shot and few-shot feedback on each Feedback Perceptions Questionnaire item after the feedback identity was revealed. Q: item.</p>
        </caption>
        <graphic xlink:href="mededu_v11i1e85614_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p><xref ref-type="table" rid="table2">Table 2</xref> presents students’ evaluations of each feedback type through focus group interviews. The qualitative analysis revealed both common and distinct characteristics of zero-shot and few-shot feedback.</p>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Students’ evaluations of each feedback type.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="230"/>
          <col width="120"/>
          <col width="150"/>
          <col width="470"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Category and subcategory</td>
              <td>Valence</td>
              <td>Speaker ID</td>
              <td>Example quotes</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="5">
                <bold>Zero-shot feedback</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Praising tone</td>
              <td>Positive</td>
              <td>D, E, F, G, H, and I</td>
              <td>“Zero-shot feedback makes me feel good, so it’s the one I would want to read first to get motivated.” [F]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Excessive and unrealistic praise</td>
              <td>Negative</td>
              <td>K and L</td>
              <td>“Zero-shot feedback is overpraising—basically nothing but praise. It feels over the top.” [K]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Enhancement of readability</td>
              <td>Positive</td>
              <td>J</td>
              <td>“The comments on writing structure were helpful.” [J]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Clarification of vague points</td>
              <td>Positive</td>
              <td>D, F, H, and J</td>
              <td>“Zero-shot feedback is convincing because it points out the areas I am unclear about.” [D]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Lack of critical comments</td>
              <td>Negative</td>
              <td>E, G, and H</td>
              <td>“Zero-shot feedback gives a lot of praise and is very affirming, but I feel it lacks critical comments, which leaves me feeling unsatisfied and wondering if it’s really good enough.” [E]</td>
            </tr>
            <tr valign="top">
              <td colspan="5">
                <bold>Few-shot feedback</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Praising tone</td>
              <td>Positive</td>
              <td>F</td>
              <td>“Few-shot feedback makes me happy because it ends with an encouraging phrase.” [F]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Justified praise</td>
              <td>Positive</td>
              <td>L</td>
              <td>“I felt few-shot feedback praised the parts it genuinely considered good.” [L]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Lack of praising tone</td>
              <td>Negative</td>
              <td>I</td>
              <td>“I want feedback to tell me what’s good. If I read only few-shot feedback, I end up thinking, ‘Should I just rebuild the whole thing from scratch?’” [I]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Enhancement of readability</td>
              <td>Positive</td>
              <td>D and L</td>
              <td>“Few-shot feedback is helpful because it revises the text to make it easier for the reader to understand.” [D]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Example sentences</td>
              <td>Positive</td>
              <td>E</td>
              <td>“Few-shot feedback is helpful because it gives example sentences, which makes the feedback easier to imagine.” [E]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Identification of areas for improvement</td>
              <td>Positive</td>
              <td>I, K, and L</td>
              <td>“Few-shot feedback offered comments such as ‘you might also include...’ and ‘it would be good to consider...,’ which made me realize what I was missing. It directly addressed my areas for improvement.” [I]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Perceived teacher authorship</td>
              <td>—<sup>a</sup></td>
              <td>I</td>
              <td>“I thought the feedback had been written by the teacher pretending to be AI.” [I]</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup>The valence was not clearly identifiable as positive or negative.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>A shared subcategory for both feedback types was “praising tone,” but its quality and degree were perceived differently. For zero-shot feedback, most students (6/9, 67%) found the praise motivating and felt that it made them happy. However, this was also described negatively by some as excessive and unrealistic praise:</p>
      <disp-quote>
        <p>Zero-shot feedback is overpraising—basically nothing but praise. It feels over the top.</p>
        <attrib>K</attrib>
      </disp-quote>
      <p>In contrast, although one student noted a lack of praising tone compared to zero-shot feedback, few-shot feedback’s praise was perceived as more justified and authentic:</p>
      <disp-quote>
        <p>I felt few-shot feedback praised the parts it genuinely considered good.</p>
        <attrib>L</attrib>
      </disp-quote>
      <p>Regarding the feedback content, zero-shot feedback was positively valued for its clarification of vague points and its enhancement of readability through comments on writing structure. Conversely, a key drawback noted by students was a lack of critical comments, which left them feeling unsatisfied and uncertain about their work’s actual quality.</p>
      <p>Few-shot feedback was also praised for its enhancement of readability. Furthermore, students highlighted its unique strengths in providing concrete example sentences, which made the feedback easier to imagine, and its clear identification of areas for improvement. Notably, a student commented on the perceived teacher authorship of few-shot feedback, thinking it had been written by a teacher pretending to be AI.</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Interpretation of the Results</title>
        <p>This study aimed to evaluate the quality of few-shot feedback on case reports by comparing it with zero-shot feedback in Japanese physical therapy education using a mixed methods approach. The quantitative results showed that 74% (26/35) of the students preferred few-shot feedback to zero-shot feedback for overall usefulness, although no significant difference was found between the total FPQ scores for the 2 feedback types. The qualitative analysis revealed that zero-shot feedback was favored for its praising tone, whereas few-shot feedback was valued for its concrete guidance for improvement. Furthermore, after the feedback identities were revealed, the positive perception of few-shot feedback was maintained, whereas evaluations for zero-shot feedback tended to become more negative. This suggests that, even though both feedback types were AI generated, the impact of algorithm aversion differs depending on the generation condition.</p>
        <p>While no significant difference was observed between the total FPQ scores for zero-shot and few-shot feedback, the Wilcoxon signed rank test on specific FPQ scales demonstrated that few-shot feedback scored significantly higher in fairness, usefulness, and willingness on several key items. Conversely, zero-shot feedback scored significantly higher on the affect scale, eliciting more positive emotions from students. However, after applying the Bonferroni correction for multiple comparisons, none of these differences remained statistically significant. These results must be interpreted with caution given that the study’s statistical power was limited, which increases the risk of type II error. Considering this limitation, coupled with the exploratory nature of this research into the novel area of few-shot feedback, the FPQ items that showed significant differences before correction may indicate potential trends. These items warrant further investigation in future, larger-scale studies, where they might serve to corroborate the findings of the qualitative analysis.</p>
        <p>The qualitative analysis revealed that students appreciated the encouraging and praising tone of zero-shot feedback. Regarding few-shot feedback, they valued its more specific and justified praising comments, even if the praise was less frequent. Considering research indicating that LLMs can be more encouraging than humans [<xref ref-type="bibr" rid="ref38">38</xref>] and that humans tend to focus on areas for improvement rather than praise [<xref ref-type="bibr" rid="ref39">39</xref>], this suggests that the praising tone of few-shot feedback may have decreased as it imitated these human elements. To ensure a strict comparison between the 2 feedback types in this study, we intentionally made no adjustments to the prompts to control for this praising tone. However, future research should examine how student perceptions change when prompts are adjusted to control for this praising tone as such prompt engineering might lead to few-shot feedback being perceived more favorably by students. Furthermore, our results using Gemini 2.5 Pro may not generalize to other LLMs as outputs can differ significantly between models even when using identical prompts [<xref ref-type="bibr" rid="ref40">40</xref>-<xref ref-type="bibr" rid="ref43">43</xref>]. Moreover, as LLMs are updated frequently, future model updates might enable even zero-shot settings to produce more personalized and contextual outputs based on a user’s past data, potentially altering the findings of this study. Given these factors, future research should compare the quality of zero-shot and few-shot feedback across different LLMs.</p>
        <p>While students appreciated that zero-shot feedback helped clarify vague points, they noted that it lacked the critical comments necessary for further improvement. In contrast, few-shot feedback was perceived more favorably because it not only pointed out areas for improvement but also offered concrete strategies on how to make those improvements by providing specific textual examples. This ability was interpreted as a form of contextual understanding as the few-shot feedback seemed to infer unstated information from the case report. A study by Pahi et al [<xref ref-type="bibr" rid="ref38">38</xref>], which explored a collaborative feedback process involving teaching assistants and ChatGPT, revealed that teaching assistants were particularly effective at providing detailed technical comments and identifying conceptual gaps. Similarly, a large-scale study by Henderson et al [<xref ref-type="bibr" rid="ref39">39</xref>] across 4 Australian universities investigating perceptions of AI and human feedback found that students perceived human feedback as more in depth (nuanced) and contextualized than AI feedback. These findings are consistent with the results of our study and are supported by a report from the Organisation for Economic Co-operation and Development (OECD) [<xref ref-type="bibr" rid="ref9">9</xref>], which notes that current AI systems still face significant challenges in qualitative reasoning and interpreting unstructured contexts. This suggests that, although no direct human intervention was applied, the human element from the leveraged teacher-created examples may have influenced the few-shot feedback to provide these more conceptual and clinical insights that AI cannot yet fully replicate.</p>
        <p>A central finding was the significant shift in student perceptions after disclosure of the feedback’s identity. Feedback effectiveness depends on how students perceive its source (eg, teachers, peers, or parents) regardless of the feedback’s quality [<xref ref-type="bibr" rid="ref44">44</xref>]. This distinction is crucial when considering algorithm aversion. In our study, zero-shot feedback tended to be re-evaluated negatively after its identity was revealed, which aligns with prior research [<xref ref-type="bibr" rid="ref31">31</xref>]. This phenomenon likely reflects a lack of trust in the feedback source [<xref ref-type="bibr" rid="ref30">30</xref>]. In contrast, few-shot feedback showed resistance to algorithm aversion. This suggests that the few-shot setting inherited perceived humanlike qualities and enhanced its trustworthiness [<xref ref-type="bibr" rid="ref39">39</xref>], thus mitigating the negative effects of algorithm aversion.</p>
      </sec>
      <sec>
        <title>Limitations and Future Directions</title>
        <p>While the generalizability of our research is constrained by the limited number of participants and its single-institution context in Japan, the findings hold significant transferability to broader health sciences education contexts, such as occupational therapy, nursing, and pharmacy. As the challenge of providing high-quality, real-time formative feedback to cultivate students’ clinical reasoning is common to these fields, our few-shot feedback model offers foundational insights for advancing the use of AI in health professions education. To validate the applicability of this model, future work should involve cross-institutional and multidisciplinary studies. Furthermore, comparative trials and longitudinal studies will be necessary to validate the hypothesis that few-shot feedback can more effectively develop students’ clinical reasoning skills than other feedback types, including human-created feedback.</p>
      </sec>
      <sec>
        <title>Implications</title>
        <p>As the few-shot feedback methodology presented in this paper only requires providing an LLM with examples of a teacher’s prior feedback and using a simple prompt, it demands little specialized AI knowledge or skills. The United Nations Educational, Scientific, and Cultural Organization (UNESCO) AI framework [<xref ref-type="bibr" rid="ref45">45</xref>] states that teachers are expected to acquire skills to adapt or customize AI tools to build human-centered teaching practice. While acquiring such skills is a valuable long-term goal, it can be challenging, particularly for novice teachers. Therefore, the few-shot feedback model offers a highly practical and immediately accessible solution that lowers the barrier to entry for AI integration.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study demonstrated that Japanese physical therapy students perceived few-shot feedback more favorably than zero-shot feedback on case reports and that this few-shot feedback model showed potential to mitigate algorithm aversion. This few-shot AI model is expected to serve as an effective support tool that empowers students to autonomously write case reports, reflect on their clinical reasoning processes, and cultivate advanced thinking skills.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Prompts for creating zero-shot and few-shot feedback with an example of prior teacher-created feedback.</p>
        <media xlink:href="mededu_v11i1e85614_app1.doc" xlink:title="DOC File, 40 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Examples of zero-shot and few-shot feedback on a case report.</p>
        <media xlink:href="mededu_v11i1e85614_app2.doc" xlink:title="DOC File, 56 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Detailed statistical results of the Feedback Perceptions Questionnaire scores.</p>
        <media xlink:href="mededu_v11i1e85614_app3.xlsx" xlink:title="XLSX File (Microsoft Excel File), 16 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Detailed data on the direction of changes in Feedback Perceptions Questionnaire scores for each item.</p>
        <media xlink:href="mededu_v11i1e85614_app4.xlsx" xlink:title="XLSX File (Microsoft Excel File), 11 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">FPQ</term>
          <def>
            <p>Feedback Perceptions Questionnaire</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">OECD</term>
          <def>
            <p>Organisation for Economic Co-operation and Development</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">UNESCO</term>
          <def>
            <p>United Nations Educational, Scientific, and Cultural Organization</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <notes>
      <sec>
        <title>Funding</title>
        <p>No external financial support or grants were received from any public, commercial, or not-for-profit entities for the research, authorship, or publication of this paper.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Zary</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Applications and challenges of implementing artificial intelligence in medical education: integrative review</article-title>
          <source>JMIR Med Educ</source>
          <year>2019</year>
          <month>06</month>
          <day>15</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>e13930</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2019/1/e13930/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13930</pub-id>
          <pub-id pub-id-type="medline">31199295</pub-id>
          <pub-id pub-id-type="pii">v5i1e13930</pub-id>
          <pub-id pub-id-type="pmcid">PMC6598417</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Safranek</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Sidamon-Eristoff</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Gilson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chartash</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The role of large language models in medical education: applications and implications</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <month>08</month>
          <day>14</day>
          <volume>9</volume>
          <fpage>e50945</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e50945/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/50945</pub-id>
          <pub-id pub-id-type="medline">37578830</pub-id>
          <pub-id pub-id-type="pii">v9i1e50945</pub-id>
          <pub-id pub-id-type="pmcid">PMC10463084</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tam</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Huynh</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Luong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khatri</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Nursing education in the age of artificial intelligence powered chatbots (AI-chatbots): are we ready yet?</article-title>
          <source>Nurse Educ Today</source>
          <year>2023</year>
          <month>10</month>
          <volume>129</volume>
          <fpage>105917</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0260-6917(23)00211-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.nedt.2023.105917</pub-id>
          <pub-id pub-id-type="medline">37506622</pub-id>
          <pub-id pub-id-type="pii">S0260-6917(23)00211-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gordon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Daniel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ajiboye</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Uraiby</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>NY</given-names>
            </name>
            <name name-style="western">
              <surname>Bartlett</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hanson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Haas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Spadafore</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Grafton-Clarke</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gasiea</surname>
              <given-names>RY</given-names>
            </name>
            <name name-style="western">
              <surname>Michie</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Corral</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kwan</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Dolmans</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Thammasitboon</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A scoping review of artificial intelligence in medical education: BEME guide no. 84</article-title>
          <source>Med Teach</source>
          <year>2024</year>
          <month>02</month>
          <day>29</day>
          <volume>46</volume>
          <issue>4</issue>
          <fpage>446</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.1080/0142159x.2024.2314198</pub-id>
          <pub-id pub-id-type="medline">38423127</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kovalainen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pramila-Savukoski</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kuivila</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Juntunen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jarva</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rasi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mikkonen</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Utilising artificial intelligence in developing education of health sciences higher education: an umbrella review of reviews</article-title>
          <source>Nurse Educ Today</source>
          <year>2025</year>
          <month>04</month>
          <volume>147</volume>
          <fpage>106600</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0260-6917(25)00035-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.nedt.2025.106600</pub-id>
          <pub-id pub-id-type="medline">39904286</pub-id>
          <pub-id pub-id-type="pii">S0260-6917(25)00035-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tekin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yurdal</surname>
              <given-names>MO</given-names>
            </name>
            <name name-style="western">
              <surname>Toraman</surname>
              <given-names>Ç</given-names>
            </name>
            <name name-style="western">
              <surname>Korkmaz</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Uysal</surname>
              <given-names>İ</given-names>
            </name>
          </person-group>
          <article-title>Is AI the future of evaluation in medical education?? AI vs. human evaluation in objective structured clinical examination</article-title>
          <source>BMC Med Educ</source>
          <year>2025</year>
          <month>05</month>
          <day>01</day>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>641</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmededuc.biomedcentral.com/articles/10.1186/s12909-025-07241-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12909-025-07241-4</pub-id>
          <pub-id pub-id-type="medline">40312328</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12909-025-07241-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC12046780</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pham</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Karunaratne</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Exintaris</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lay</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yuriev</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The impact of generative AI on health professional education: a systematic review in the context of student learning</article-title>
          <source>Med Educ</source>
          <year>2025</year>
          <month>12</month>
          <day>18</day>
          <volume>59</volume>
          <issue>12</issue>
          <fpage>1280</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1111/medu.15746</pub-id>
          <pub-id pub-id-type="medline">40533396</pub-id>
          <pub-id pub-id-type="pmcid">PMC12686775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prégent</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>VH</given-names>
            </name>
            <name name-style="western">
              <surname>El Adib</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Désilets</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hudon</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Applications of artificial intelligence in psychiatry and psychology education: scoping review</article-title>
          <source>JMIR Med Educ</source>
          <year>2025</year>
          <month>07</month>
          <day>28</day>
          <volume>11</volume>
          <fpage>e75238</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2025/1/e75238/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/75238</pub-id>
          <pub-id pub-id-type="medline">40720804</pub-id>
          <pub-id pub-id-type="pii">v11i1e75238</pub-id>
          <pub-id pub-id-type="pmcid">PMC12340458</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <article-title>Introducing the OECD AI capability indicators</article-title>
          <source>Organisation for Economic Co-operation and Development</source>
          <access-date>2025-08-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.oecd.org/en/publications/introducing-the-oecd-ai-capability-indicators_be745f04-en">https://www.oecd.org/en/publications/introducing-the-oecd-ai-capability-indicators_be745f04-en</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kassirer</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>Teaching clinical reasoning: case-based and coached</article-title>
          <source>Acad Med</source>
          <year>2010</year>
          <month>07</month>
          <volume>85</volume>
          <issue>7</issue>
          <fpage>1118</fpage>
          <lpage>24</lpage>
          <pub-id pub-id-type="doi">10.1097/acm.0b013e3181d5dd0d</pub-id>
          <pub-id pub-id-type="medline">20603909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Florek</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Dellavalle</surname>
              <given-names>RP</given-names>
            </name>
          </person-group>
          <article-title>Case reports in medical education: a platform for training medical students, residents, and fellows in scientific writing and critical thinking</article-title>
          <source>J Med Case Rep</source>
          <year>2016</year>
          <month>04</month>
          <day>06</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>86</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jmedicalcasereports.biomedcentral.com/articles/10.1186/s13256-016-0851-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13256-016-0851-5</pub-id>
          <pub-id pub-id-type="medline">27048362</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13256-016-0851-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC4822269</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hartjes</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Schilder</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>van Unen</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Richir</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>van Agtmael</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Tichelaar</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Therapeutic reasoning in case reports: insights into current reporting and learning opportunities</article-title>
          <source>Br J Clin Pharmacol</source>
          <year>2025</year>
          <month>11</month>
          <day>19</day>
          <volume>91</volume>
          <issue>11</issue>
          <fpage>3236</fpage>
          <lpage>43</lpage>
          <pub-id pub-id-type="doi">10.1002/bcp.70176</pub-id>
          <pub-id pub-id-type="medline">40682527</pub-id>
          <pub-id pub-id-type="pmcid">PMC12569556</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fleckenstein</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liebenow</surname>
              <given-names>LW</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Automated feedback and writing: a multi-level meta-analysis of effects on students' performance</article-title>
          <source>Front Artif Intell</source>
          <year>2023</year>
          <month>07</month>
          <day>03</day>
          <volume>6</volume>
          <fpage>1162454</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37465061"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/frai.2023.1162454</pub-id>
          <pub-id pub-id-type="medline">37465061</pub-id>
          <pub-id pub-id-type="pmcid">PMC10351274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schiller</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liebenow</surname>
              <given-names>LW</given-names>
            </name>
            <name name-style="western">
              <surname>Steinbach</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Horbach</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fleckenstein</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using LLMs to bring evidence-based feedback into the classroom: AI-generated feedback increases secondary students’ text revision, motivation, and positive emotions</article-title>
          <source>Comput Educ Artif Intell</source>
          <year>2024</year>
          <month>06</month>
          <volume>6</volume>
          <fpage>100199</fpage>
          <pub-id pub-id-type="doi">10.1016/j.caeai.2023.100199</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Enhancing critical writing through AI feedback: a randomized control study</article-title>
          <source>Behav Sci (Basel)</source>
          <year>2025</year>
          <month>04</month>
          <day>30</day>
          <volume>15</volume>
          <issue>5</issue>
          <fpage>600</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=bs15050600"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/bs15050600</pub-id>
          <pub-id pub-id-type="medline">40426378</pub-id>
          <pub-id pub-id-type="pii">bs15050600</pub-id>
          <pub-id pub-id-type="pmcid">PMC12109289</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gaeta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Orciuoli</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Pascuzzo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Peduto</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Enhancing traditional ITS architectures with large language models for generating motivational feedback</article-title>
          <source>Comput Educ Artif Intell</source>
          <year>2025</year>
          <month>12</month>
          <volume>9</volume>
          <fpage>100433</fpage>
          <pub-id pub-id-type="doi">10.1016/j.caeai.2025.100433</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shute</surname>
              <given-names>VJ</given-names>
            </name>
          </person-group>
          <article-title>Focus on formative feedback</article-title>
          <source>Rev Educ Res</source>
          <year>2008</year>
          <month>03</month>
          <day>01</day>
          <volume>78</volume>
          <issue>1</issue>
          <fpage>153</fpage>
          <lpage>89</lpage>
          <pub-id pub-id-type="doi">10.3102/0034654307313795</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bucol</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Sangkawong</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Exploring ChatGPT as a writing assessment tool</article-title>
          <source>Innov Educ Teach Int</source>
          <year>2024</year>
          <month>06</month>
          <day>07</day>
          <volume>62</volume>
          <issue>3</issue>
          <fpage>867</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.1080/14703297.2024.2363901</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>YS</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Aldino</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gašević</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Assessing the proficiency of large language models in automatic feedback generation: an evaluation study</article-title>
          <source>Comput Educ Artif Intell</source>
          <year>2024</year>
          <month>12</month>
          <volume>7</volume>
          <fpage>100299</fpage>
          <pub-id pub-id-type="doi">10.1016/j.caeai.2024.100299</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chai</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aubrey</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Comparing the effects of ChatGPT and automated writing evaluation on students’ writing and ideal L2 writing self</article-title>
          <source>Comput Assist Lang Learn</source>
          <year>2025</year>
          <month>02</month>
          <day>03</day>
          <fpage>1</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.1080/09588221.2025.2454541</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Seßler</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bewersdorff</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nerdel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kasneci</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Towards adaptive feedback with AI: comparing the feedback quality of LLMs and teachers on experimentation protocols</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online February 18, 2025</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2502.12842"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2502.12842</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Banihashem</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Kerman</surname>
              <given-names>NT</given-names>
            </name>
            <name name-style="western">
              <surname>Noroozi</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Moon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Drachsler</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Feedback sources in essay writing: peer-generated or AI-generated feedback?</article-title>
          <source>Int J Educ Technol High Educ</source>
          <year>2024</year>
          <month>04</month>
          <day>12</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1186/s41239-024-00455-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Escalante</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pack</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barrett</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>AI-generated feedback on writing: insights into efficacy and ENL student preference</article-title>
          <source>Int J Educ Technol High Educ</source>
          <year>2023</year>
          <month>10</month>
          <day>27</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>57</fpage>
          <pub-id pub-id-type="doi">10.1186/s41239-023-00425-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaccaro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Almaatouq</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Malone</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>When combinations of humans and AI are useful: a systematic review and meta-analysis</article-title>
          <source>Nat Hum Behav</source>
          <year>2024</year>
          <month>12</month>
          <day>28</day>
          <volume>8</volume>
          <issue>12</issue>
          <fpage>2293</fpage>
          <lpage>303</lpage>
          <pub-id pub-id-type="doi">10.1038/s41562-024-02024-1</pub-id>
          <pub-id pub-id-type="medline">39468277</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41562-024-02024-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC11659167</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Capellini</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Atienza</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sconfield</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Knowledge accuracy and reducing hallucinations in LLMs via dynamic domain knowledge injection</article-title>
          <source>Research Square</source>
          <comment>Preprint posted online June 6, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchsquare.com/article/rs-4540506/v1"/>
          </comment>
          <pub-id pub-id-type="doi">10.21203/rs.3.rs-4540506/v1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sui</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>A survey on in-context learning</article-title>
          <source>Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing</source>
          <year>2024</year>
          <conf-name>EMNLP '24</conf-name>
          <conf-date>November 12-16, 2024</conf-date>
          <conf-loc>Miami, FL</conf-loc>
          <fpage>1107</fpage>
          <lpage>28</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2024.emnlp-main.64.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2024.emnlp-main.64</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Mann</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ryder</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Subbiah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kaplan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dhariwal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Neelakantan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shyam</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sastry</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Askell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Herbert-Voss</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Krueger</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Henighan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Child</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ramesh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ziegler</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Winter</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hesse</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sigler</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Litwin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chess</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Berner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>McCandlish</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Radford</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Amodei</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Language models are few-shot learners</article-title>
          <source>Proceedings of the 34th International Conference on Neural Information Processing Systems</source>
          <year>2020</year>
          <conf-name>NIPS '20</conf-name>
          <conf-date>December 6-12, 2020</conf-date>
          <conf-loc>Vancouver, BC</conf-loc>
          <fpage>1877</fpage>
          <lpage>901</lpage>
          <pub-id pub-id-type="doi">10.5555/3495724.3495883</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rüdian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Podelo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kužílek</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pinkwart</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Feedback on feedback: student’s perceptions for feedback from teachers and few-shot LLMs</article-title>
          <source>Proceedings of the 15th International Learning Analytics and Knowledge Conference</source>
          <year>2025</year>
          <conf-name>LAK '25</conf-name>
          <conf-date>March 3-7, 2025</conf-date>
          <conf-loc>Dublin, Ireland</conf-loc>
          <fpage>82</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3706468.3706479"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3706468.3706479</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dietvorst</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Simmons</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Massey</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Algorithm aversion: people erroneously avoid algorithms after seeing them err</article-title>
          <source>J Exp Psychol Gen</source>
          <year>2015</year>
          <month>02</month>
          <volume>144</volume>
          <issue>1</issue>
          <fpage>114</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1037/xge0000033</pub-id>
          <pub-id pub-id-type="medline">25401381</pub-id>
          <pub-id pub-id-type="pii">2014-48748-001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nazaretsky</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mejia-Domenzain</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Swamy</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Frej</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Käser</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>AI or human? Evaluating student feedback perceptions in higher education</article-title>
          <source>Proceedings of the 2024 Conference on Technology Enhanced Learning for Inclusive and Equitable Quality Education: 19th European Conference on Technology Enhanced Learning</source>
          <year>2024</year>
          <conf-name>EC-TEL '24</conf-name>
          <conf-date>September 16-20, 2024</conf-date>
          <conf-loc>Krems, Austria</conf-loc>
          <fpage>284</fpage>
          <lpage>98</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1007/978-3-031-72315-5_20"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/978-3-031-72315-5_20</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Suraworachet</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Nazaretsky</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cukurova</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Evaluating trust in AI, human, and co-produced feedback among undergraduate students</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online April 15, 2025</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2504.10961"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2504.10961</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Strijbos</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Narciss</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dünnebier</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Peer feedback content and sender's competence level in academic writing revision tasks: are they critical for feedback perceptions and efficiency?</article-title>
          <source>Learn Instr</source>
          <year>2010</year>
          <month>08</month>
          <volume>20</volume>
          <issue>4</issue>
          <fpage>291</fpage>
          <lpage>303</lpage>
          <pub-id pub-id-type="doi">10.1016/j.learninstruc.2009.08.008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Strijbos</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Pat-El</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Narciss</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Structural validity and invariance of the feedback perceptions questionnaire</article-title>
          <source>Stud Educ Eval</source>
          <year>2021</year>
          <month>03</month>
          <volume>68</volume>
          <fpage>100980</fpage>
          <pub-id pub-id-type="doi">10.1016/j.stueduc.2021.100980</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berndt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Strijbos</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Fischer</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Effects of written peer-feedback content and sender’s competence on perceptions, performance, and mindful cognitive processing</article-title>
          <source>Eur J Psychol Educ</source>
          <year>2017</year>
          <month>08</month>
          <day>13</day>
          <volume>33</volume>
          <issue>1</issue>
          <fpage>31</fpage>
          <lpage>49</lpage>
          <pub-id pub-id-type="doi">10.1007/s10212-017-0343-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huisman</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Saab</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>van Driel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van den Broek</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Peer feedback on academic writing: undergraduate students’ peer feedback role, peer feedback perceptions and essay performance</article-title>
          <source>Assess Eval High Educ</source>
          <year>2018</year>
          <month>01</month>
          <day>07</day>
          <volume>43</volume>
          <issue>6</issue>
          <fpage>955</fpage>
          <lpage>68</lpage>
          <pub-id pub-id-type="doi">10.1080/02602938.2018.1424318</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ravšelj</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Keržič</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tomaževič</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Umek</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Brezovar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>A Iahad</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Abdulla</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Akopyan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Aldana Segura</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>AlHumaid</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Allam</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Alló</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Andoh</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Andronic</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Arthur</surname>
              <given-names>YD</given-names>
            </name>
            <name name-style="western">
              <surname>Aydın</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Badran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Balbontín-Alvarado</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ben Saad</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bencsik</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Benning</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Besimi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bezerra</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Buizza</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Burro</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bwalya</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cachero</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Castillo-Briceno</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Castro</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chai</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Charalambous</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>TK</given-names>
            </name>
            <name name-style="western">
              <surname>Clipa</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Colombari</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Corral Escobedo</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Costa</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Crețulescu</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Crispino</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cucari</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dalton</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Demir Kaya</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dumić-Čule</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Dwidienawati</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ebardo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Egbenya</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Faris</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Fečko</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrinho</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Florea</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fong</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Francis</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ghilardi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>González-Fernández</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hossain</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Hug</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Inasius</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ismail</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jahić</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jessa</surname>
              <given-names>MO</given-names>
            </name>
            <name name-style="western">
              <surname>Kapanadze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kar</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Kateeb</surname>
              <given-names>ET</given-names>
            </name>
            <name name-style="western">
              <surname>Kaya</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Khadri</surname>
              <given-names>HO</given-names>
            </name>
            <name name-style="western">
              <surname>Kikuchi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kobets</surname>
              <given-names>VM</given-names>
            </name>
            <name name-style="western">
              <surname>Kostova</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Krasmane</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Law</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Lazăr</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lazović-Pita</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>VW</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>López-Aguilar</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Luca</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Luciano</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Machin-Mastromatteo</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Madi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Manguele</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Manrique</surname>
              <given-names>RF</given-names>
            </name>
            <name name-style="western">
              <surname>Mapulanga</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Marimon</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Marinova</surname>
              <given-names>GI</given-names>
            </name>
            <name name-style="western">
              <surname>Mas-Machuca</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mejía-Rodríguez</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Meletiou-Mavrotheris</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Méndez-Prado</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Meza-Cano</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Mirķe</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mital</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Mollica</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Morariu</surname>
              <given-names>DI</given-names>
            </name>
            <name name-style="western">
              <surname>Mospan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mukuka</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Navarro Jiménez</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Nikaj</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Nisheva</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Nisiforou</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Njiku</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nomnian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nuredini-Mehmedi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Nyamekye</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Obadić</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Okela</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Olenik-Shemesh</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ostoj</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Peralta-Rizzo</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Peštek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pilav-Velić</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pires</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Rabin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Raccanello</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ramie</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rashid</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Reuter</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Reyes</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Rodrigues</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Rodway</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ručinská</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sadzaglishvili</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Salem</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Savić</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Schepman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shahpo</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Snouber</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Soler</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sonyel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Stefanova</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Stone</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Strzelecki</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tanaka</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tapia Cortes</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Teira-Fachado</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tilga</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Titko</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tolmach</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Turmudi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Varela-Candamio</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Vekiri</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Vicentini</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Woyo</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Yorulmaz</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Yunus</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Zamfir</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aristovnik</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Higher education students' perceptions of ChatGPT: a global study of early reactions</article-title>
          <source>PLoS One</source>
          <year>2025</year>
          <month>2</month>
          <day>5</day>
          <volume>20</volume>
          <issue>2</issue>
          <fpage>e0315011</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0315011"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0315011</pub-id>
          <pub-id pub-id-type="medline">39908277</pub-id>
          <pub-id pub-id-type="pii">PONE-D-24-36762</pub-id>
          <pub-id pub-id-type="pmcid">PMC11798494</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Braun</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Using thematic analysis in psychology</article-title>
          <source>Qual Res Psychol</source>
          <year>2008</year>
          <month>07</month>
          <day>21</day>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>77</fpage>
          <lpage>101</lpage>
          <pub-id pub-id-type="doi">10.1191/1478088706qp063oa</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pahi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hawlader</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hicks</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zaman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Phan</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Enhancing active learning through collaboration between human teachers and generative AI</article-title>
          <source>Comput Educ Open</source>
          <year>2024</year>
          <month>06</month>
          <volume>6</volume>
          <fpage>100183</fpage>
          <pub-id pub-id-type="doi">10.1016/j.caeo.2024.100183</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Henderson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bearman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fawns</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Buckingham Shum</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Matthews</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>de Mello Heredia</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Comparing generative AI and teacher feedback: student perceptions of usefulness and trustworthiness</article-title>
          <source>Assess Eval High Educ</source>
          <year>2025</year>
          <month>05</month>
          <day>13</day>
          <volume>50</volume>
          <issue>7</issue>
          <fpage>1</fpage>
          <lpage>16</lpage>
          <pub-id pub-id-type="doi">10.1080/02602938.2025.2502582</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ito</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ishibashi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hayashi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kojima</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sogabe</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Large language models for the national radiological technologist licensure examination in Japan: cross-sectional comparative benchmarking and evaluation of model-generated items study</article-title>
          <source>JMIR Med Educ</source>
          <year>2025</year>
          <month>11</month>
          <day>13</day>
          <volume>11</volume>
          <fpage>e81807</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2025/1/e81807/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/81807</pub-id>
          <pub-id pub-id-type="medline">41232030</pub-id>
          <pub-id pub-id-type="pii">v11i1e81807</pub-id>
          <pub-id pub-id-type="pmcid">PMC12614397</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaewboonlert</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Poontananggul</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pongsuwan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bhakdisongkhram</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Factors associated with the accuracy of large language models in basic medical science examinations: cross-sectional study</article-title>
          <source>JMIR Med Educ</source>
          <year>2025</year>
          <month>01</month>
          <day>13</day>
          <volume>11</volume>
          <fpage>e58898</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2025/1/e58898/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/58898</pub-id>
          <pub-id pub-id-type="medline">39846415</pub-id>
          <pub-id pub-id-type="pii">v11i1e58898</pub-id>
          <pub-id pub-id-type="pmcid">PMC11745146</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the performance of DeepSeek-R1 and DeepSeek-V3 versus OpenAI models in the Chinese national medical licensing examination: cross-sectional comparative study</article-title>
          <source>JMIR Med Educ</source>
          <year>2025</year>
          <month>11</month>
          <day>14</day>
          <volume>11</volume>
          <fpage>e73469</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2025/1/e73469/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/73469</pub-id>
          <pub-id pub-id-type="medline">41237388</pub-id>
          <pub-id pub-id-type="pii">v11i1e73469</pub-id>
          <pub-id pub-id-type="pmcid">PMC12663704</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Performance evaluation and implications of large language models in radiology board exams: prospective comparative analysis</article-title>
          <source>JMIR Med Educ</source>
          <year>2025</year>
          <month>01</month>
          <day>16</day>
          <volume>11</volume>
          <fpage>e64284</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2025/1/e64284/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/64284</pub-id>
          <pub-id pub-id-type="medline">39819381</pub-id>
          <pub-id pub-id-type="pii">v11i1e64284</pub-id>
          <pub-id pub-id-type="pmcid">PMC11756834</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hattie</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Timperley</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The power of feedback</article-title>
          <source>Rev Educ Res</source>
          <year>2007</year>
          <month>03</month>
          <day>01</day>
          <volume>77</volume>
          <issue>1</issue>
          <fpage>81</fpage>
          <lpage>112</lpage>
          <pub-id pub-id-type="doi">10.3102/003465430298487</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miao</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Cukurova</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>AI competency framework for teachers</article-title>
          <source>UNESCO</source>
          <access-date>2025-09-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://unesdoc.unesco.org/ark:/48223/pf0000391104">https://unesdoc.unesco.org/ark:/48223/pf0000391104</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
