<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JME</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Educ</journal-id>
      <journal-title>JMIR Medical Education</journal-title>
      <issn pub-type="epub">2369-3762</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v12i1e76924</article-id>
      <article-id pub-id-type="pmid">42297358</article-id>
      <article-id pub-id-type="doi">10.2196/76924</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Tutorial</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Tutorial</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Developing a Large Language Model–Based Feedback System for Case Report Writing in Rehabilitation Education: Tutorial</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Leung</surname>
            <given-names>Tiffany</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Koda</surname>
            <given-names>Masahide</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Tonouchi</surname>
            <given-names>Yuuto</given-names>
          </name>
          <degrees>BScOT</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Rehabilitation</institution>
            <institution>Kyoto Min-iren Asukai Hospital</institution>
            <addr-line>89, Tanaka-asukai</addr-line>
            <addr-line>Sakyo-ku</addr-line>
            <addr-line>Kyoto, Kyoto, 606-8226</addr-line>
            <country>Japan</country>
            <fax>81 75 701 9183</fax>
            <phone>81 75 712 9091</phone>
            <email>yuuto.0901el7@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-4813-4829</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Nakai</surname>
            <given-names>Shunsuke</given-names>
          </name>
          <degrees>BScOT, DHSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0008-8775-0715</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Murakami</surname>
            <given-names>Kayo</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0004-1516-8452</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Kataoka</surname>
            <given-names>Yuki</given-names>
          </name>
          <degrees>MD, MPH, DrPH</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7982-5213</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Rehabilitation</institution>
        <institution>Kyoto Min-iren Asukai Hospital</institution>
        <addr-line>Kyoto, Kyoto</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Occupational Therapy</institution>
        <institution>Faculty of Rehabilitation</institution>
        <institution>Morinomiya University of Medical Sciences</institution>
        <addr-line>Osaka, Osaka</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Graduate School of Rehabilitation Science</institution>
        <institution>Osaka Metropolitan University</institution>
        <addr-line>Osaka, Osaka</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Center for Postgraduate Clinical Training and Career Development</institution>
        <institution>Nagoya University Hospital</institution>
        <addr-line>Nagoya, Aichi</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Center for Medical Education</institution>
        <institution>Graduate School of Medicine</institution>
        <institution>Nagoya University</institution>
        <addr-line>Nagoya, Aichi</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department of Healthcare Epidemiology</institution>
        <institution>Graduate School of Medicine and Public Health</institution>
        <institution>Kyoto University</institution>
        <addr-line>Kyoto, Kyoto</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Department of Systematic Reviewers</institution>
        <institution>Scientific Research Works Peer Support Group (SRWS-PSG)</institution>
        <addr-line>Osaka, Osaka</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>Department of Internal Medicine</institution>
        <institution>Kyoto Min-iren Asukai Hospital</institution>
        <addr-line>Kyoto, Kyoto</addr-line>
        <country>Japan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Yuuto Tonouchi <email>yuuto.0901el7@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>15</day>
        <month>6</month>
        <year>2026</year>
      </pub-date>
      <volume>12</volume>
      <elocation-id>e76924</elocation-id>
      <history>
        <date date-type="received">
          <day>12</day>
          <month>5</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>9</day>
          <month>12</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>28</day>
          <month>5</month>
          <year>2026</year>
        </date>
      </history>
      <copyright-statement>©Yuuto Tonouchi, Shunsuke Nakai, Kayo Murakami, Yuki Kataoka. Originally published in JMIR Medical Education (https://mededu.jmir.org), 15.06.2026.</copyright-statement>
      <copyright-year>2026</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Education, is properly cited. The complete bibliographic information, a link to the original publication on https://mededu.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://mededu.jmir.org/2026/1/e76924" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Novice health care staff often write case reports during early clinical training. However, many institutions lack structured feedback systems because of time constraints and instructor shortages. Large language models, a form of artificial intelligence (AI), offer new opportunities to enhance educational feedback, yet their application in clinical training requires careful design to ensure pedagogically appropriate and ethically sound outputs.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This tutorial provides a practical guide for educators without programming experience to develop an AI-based feedback system using 3 accessible tools: Dify (an AI workflow platform), Slack (a messaging app), and Google Apps Script. The system balances educational quality with operational efficiency while incorporating data privacy safeguards for clinical educational content.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We developed a feedback system comprising 4 AI chatbots with 2 distinct approaches: “loop-based” bots that promote clinical reasoning through iterative, comment-based feedback and “single-shot” bots for efficient proofreading and summarization tasks. The tutorial describes the system architecture; feedback design principles grounded in formative assessment theory; a step-by-step implementation guide; and data privacy safeguards, including a deidentification protocol and application programming interface–based data protection measures. To illustrate feasibility, we conducted a pilot implementation at a community care hospital from April to June 2024, involving 5 novice staff members and 5 instructors.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A pilot implementation at a community care hospital demonstrated that the system was feasible to deploy and operate within routine clinical education workflows. Participant feedback indicated high usability and suggested that the iterative, comment-based feedback approach supported learner engagement while also identifying areas where feedback criteria required refinement to better match institutional educational goals.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This tutorial provides a reproducible framework for building a customized AI feedback system that combines comment-based iterative feedback with human-in-the-loop oversight and a multilayered data privacy framework. By following this guide, educators can implement an adaptive system tailored to their institutional context and clinical domain.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>large language model</kwd>
        <kwd>education</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>AI</kwd>
        <kwd>rehabilitation</kwd>
        <kwd>case report</kwd>
        <kwd>feedback</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>In medical education, writing is not merely a record of clinical events but a vital learning activity that supports reflection and growth. Reflective writing (RW), including the reflective elements embedded in case report writing, fosters core competencies such as clinical reasoning and professional identity formation [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. However, writing becomes educationally meaningful only when feedback effectively guides learners toward explicit goals [<xref ref-type="bibr" rid="ref3">3</xref>]. Previous studies confirm that supportive, structured, and longitudinal feedback maximizes the impact of RW [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>].</p>
        <p>Delivering such feedback at scale faces persistent challenges in clinical settings. Time constraints and limited instructional skills often prevent adequate feedback [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. Consequently, this feedback loop frequently breaks down, hindering the professional development of novice staff.</p>
        <p>Large language models (LLMs) have demonstrated utility for feedback, clinical reasoning, and research assistance, including in health care contexts [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. A recent review suggests that artificial intelligence (AI) reduces workload and improves efficiency, particularly in medical writing and administrative support [<xref ref-type="bibr" rid="ref7">7</xref>]. These developments have increased interest in applying LLMs to educational feedback for RW.</p>
        <p>However, realizing this potential requires purpose-built systems that go beyond general-purpose chatbot interactions, along with careful consideration of data privacy. This tutorial addresses that gap.</p>
      </sec>
      <sec>
        <title>Aims and Target Audience</title>
        <p>This tutorial provides a practical guide for educators without programming experience to develop an AI-based feedback system for case report writing in clinical education. Specifically, it offers (1) a conceptual framework distinguishing custom AI systems from standard chatbot use, (2) a step-by-step implementation guide using 3 accessible tools (Dify [LangGenius, Inc]; Slack [Slack Technologies, LLC]; and Google Apps Script [GAS; Google LLC]), (3) ethical and data privacy guidelines for deploying AI in medical education settings, and (4) empirical evaluation data from a pilot implementation at a community care hospital.</p>
        <p>The primary audience is clinical educators who supervise novice staff writing case reports, experience time pressure when providing feedback, and lack programming expertise. Although the examples and prompts presented here focus on rehabilitation settings as a working illustration, educators in other medical fields can adapt this framework by modifying the prompts to suit their specific clinical domains and educational objectives.</p>
      </sec>
      <sec>
        <title>Rationale for a Customized System</title>
        <p>General-purpose chatbots (eg, a standard ChatGPT interface) pose substantial risks when used without customization in medical education. The medical domain requires specialized terminology and linguistic precision that general models may fail to process accurately [<xref ref-type="bibr" rid="ref8">8</xref>]. Effective AI use in medical education depends on strategic prompt design; poorly constructed instructions can yield inaccurate or unsafe outputs [<xref ref-type="bibr" rid="ref9">9</xref>]. Mastering such prompt design techniques requires technical expertise that most clinical educators do not possess [<xref ref-type="bibr" rid="ref9">9</xref>], making accessibility a core design requirement. These considerations led us to develop a customized system rather than rely on off-the-shelf chatbot interactions.</p>
        <p>Three requirements distinguish a custom educational system from standard chatbot use. First, standardization ensures fairness. In direct chatbot interaction, response quality depends entirely on the user’s prompting skills. Novice staff may receive suboptimal feedback simply due to limited prompting skills. A custom system uses preprogrammed instructions, known as meta-prompts (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>), to evaluate every draft against the same rubric, ensuring consistent feedback for all learners. Second, integration enables visibility and progress management. When novice staff use personal chatbot accounts, educators cannot monitor their interactions. Integrating the system into a shared workspace enables educators to transparently track progress and intervene when necessary. Third, centralized logging supports educational auditing. To improve the curriculum, educators need to identify common errors among novice staff. A custom system automatically records all interactions, generating valuable data for analyzing trends in learner performance.</p>
        <boxed-text id="box1" position="float">
          <title>Prompts vs meta-prompts (user input vs system instructions).</title>
          <p>This system distinguishes between 2 types of text inputs:</p>
          <list list-type="order">
            <list-item>
              <p>Prompts (user input): the text written by the novice staff (eg, “Here is my draft...”).</p>
            </list-item>
            <list-item>
              <p>Meta-prompts (system instruction): hidden instructions preset by the educator. This text contains the persona (eg, “You are a senior physical therapist”), the rubric, and formatting rules. Separating these components ensures that the artificial intelligence consistently functions as a trained instructor, regardless of what the novice staff member inputs.</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Highlights</title>
        <p>This section is organized as follows. First, we describe the 3-component system architecture (Dify, Slack, and GAS) and the dataflow connecting them. Second, we present the feedback design principles and the specifications of 4 educational chatbots. Third, we provide a step-by-step implementation guide for reproducing the system. Fourth, we address ethical considerations and data privacy safeguards. Finally, we describe a pilot implementation conducted at a community care hospital to assess system usability and feasibility.</p>
      </sec>
      <sec>
        <title>System Architecture and Dataflow</title>
        <p><xref rid="figure1" ref-type="fig">Figure 1</xref> illustrates the operational workflow. From the novice staff’s perspective, the system provides a straightforward interaction: the novice staff member tags the relevant bot in Slack (eg, @Discussion_Bot) and submits a draft text. The system processes the request and provides specific feedback within the same thread. The novice staff member then revises the text and replies to the bot again. This iterative conversation continues until the draft meets the required standards. This workflow off-loads the time-consuming revision cycle to the AI, reserving human feedback for clinical validity and professional judgment.</p>
        <p>The system architecture consists of 3 components selected to enable implementation without advanced programming knowledge (<xref rid="figure2" ref-type="fig">Figure 2</xref>). Programming is a well-documented barrier for health care professionals seeking to develop AI applications [<xref ref-type="bibr" rid="ref10">10</xref>]. We therefore adopted an approach that does not require specialized programming expertise and uses the following 3 components: Dify, Slack, and GAS.</p>
        <p>Dify [<xref ref-type="bibr" rid="ref11">11</xref>] is an open-source LLM application development platform that serves as the system’s central processing engine. Hosted in the cloud, it receives user inputs, processes them through a predesigned workflow, and instructs the AI how to respond. Educators can build the AI’s reasoning process visually, without writing code. We selected Dify because it offered the most accessible visual interface among available open-source LLM workflow platforms, combined with built-in application programming interface (API) publishing and conversation logging. The free tier is suitable for initial testing but has limited message credits; a paid plan may be required for sustained use with multiple learners. Data sovereignty considerations are discussed in the Ethical Considerations and Data Privacy section.</p>
        <p>Slack [<xref ref-type="bibr" rid="ref12">12</xref>] serves as the interactive chat interface for novice staff. Its private channel structure enables educators to monitor all novice staff–AI interactions in real time and to communicate with novice staff within the same workspace. The free tier limits message history retention, which we addressed through automatic logging to Google Sheets via GAS.</p>
        <p>GAS functions as the technical bridge linking Slack and Dify, securely relaying messages between the 2 platforms. We chose GAS for its native integration with Google Workspace, enabling automatic logging to Google Sheets and administrator error notifications without additional infrastructure. Although Dify provides a built-in Slack plug-in for direct integration, it does not support the logging and oversight functions considered essential for educational management. When a novice staff member sends a message on Slack, the data travels through GAS to reach Dify, and the response returns along the same path. Every interaction is automatically logged, visible to educators, and monitored for errors.</p>
        <p>A key design feature is the iterative pass or revise loop implemented within Dify’s Chatflow functionality (<xref rid="figure3" ref-type="fig">Figure 3</xref>). Unlike a simple chatbot that answers a question once, effective education requires iterative engagement [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. A recent Association for Medical Education in Europe guide indicates that continuous, formative feedback aligned with explicit learning objectives develops competencies more effectively than one-time summative evaluation [<xref ref-type="bibr" rid="ref14">14</xref>]. The system, therefore, implements a conditional workflow:</p>
        <list list-type="bullet">
          <list-item>
            <p>Analyze: the system evaluates the novice staff’s draft against the defined rubric.</p>
          </list-item>
          <list-item>
            <p>Decide the following:</p>
            <list list-type="bullet">
              <list-item>
                <p>If the draft meets the criteria, the system outputs “pass” and allows the novice staff to proceed.</p>
              </list-item>
              <list-item>
                <p>If not, the system outputs “revise,” provides targeted comments, and awaits the corrected draft.</p>
              </list-item>
            </list>
          </list-item>
          <list-item>
            <p>Repeat: this mechanism prevents novice staff from overlooking feedback and promotes iterative learning.</p>
          </list-item>
        </list>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Operational flow comparison. AI: artificial intelligence.</p>
          </caption>
          <graphic xlink:href="mededu_v12i1e76924_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Three-component system architecture. AI: artificial intelligence. LLM: large language model.</p>
          </caption>
          <graphic xlink:href="mededu_v12i1e76924_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Dify Chatflow for the conditional workflow. LLM: large language model.</p>
          </caption>
          <graphic xlink:href="mededu_v12i1e76924_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Feedback Design and Bot Specifications</title>
        <sec>
          <title>Overview</title>
          <p>The feedback design rests on 2 complementary principles: comment-based feedback and the human-in-the-loop approach.</p>
          <p>Comment-based feedback prioritizes written comments over direct correction. Research suggests that comments produce greater gains in writing proficiency than simple error location or direct correction [<xref ref-type="bibr" rid="ref13">13</xref>] because comments compel learners to actively process information and revise their own work [<xref ref-type="bibr" rid="ref14">14</xref>]. The system thus functions as an always-available virtual instructor, serving as a strict gatekeeper prior to human review. By off-loading the repetitive task of checking logical consistency and structure to the AI, educators can focus on the final clinical assessment.</p>
          <p>The human-in-the-loop approach ensures that educators retain final decision-making authority; AI serves only as a support tool. The AI focuses on overall structure, logical consistency, and writing style, while avoiding specific clinical judgments to mitigate the risk of hallucinations (ie, plausible but incorrect medical advice). This system does not evaluate clinical validity or refine medical discussions. Qualified educators must provide professional feedback on these aspects, and novice staff should treat AI feedback as suggestions for improving writing structure and logic, not as clinical guidance.</p>
          <p>On the basis of these principles, the system provides 4 distinct chatbots tailored to the report writing process (<xref ref-type="table" rid="table1">Table 1</xref>; refer to <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for detailed meta-prompts). The system uses 2 distinct feedback approaches: a “loop-based” approach for iterative revision and a “single-shot” approach for efficient one-time processing.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Specifications and logic of the 4 chatbots.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="240"/>
              <col width="370"/>
              <col width="390"/>
              <thead>
                <tr valign="top">
                  <td>Chatbot name and type</td>
                  <td>Primary function</td>
                  <td>Evaluation criteria or prompt elements</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Integration and interpretation bot (loop-based feedback)</td>
                  <td>Verifies clinical reasoning and checks consistency between assessment, problems, and goals.</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Passing criteria (checkpoints)</p>
                      </list-item>
                    </list>
                    <list list-type="bullet">
                      <list-item>
                        <p>Description of the clinical overview</p>
                      </list-item>
                      <list-item>
                        <p>Clarification of focal points and rationale</p>
                      </list-item>
                      <list-item>
                        <p>Identification of specific clinical problems</p>
                      </list-item>
                      <list-item>
                        <p>Alignment of assessment data with identified problems</p>
                      </list-item>
                      <list-item>
                        <p>Formulation of treatment plan and prognosis</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>Discussion bot (loop-based feedback)</td>
                  <td>Evaluates argumentation and checks if the argument logically supports the conclusion based on evidence.</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Passing criteria (checkpoints)</p>
                      </list-item>
                    </list>
                    <list list-type="bullet">
                      <list-item>
                        <p>Summary of key intervention outcomes</p>
                      </list-item>
                      <list-item>
                        <p>Integration of relevant literature and guidelines</p>
                      </list-item>
                      <list-item>
                        <p>Comparative analysis with previous studies and original conclusions</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>Proofreading bot (single-shot output)</td>
                  <td>Enhances text quality and acts as a domain-specific AI<sup>a</sup> editor to refine style and grammar for academic submission.</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Prompt elements</p>
                      </list-item>
                    </list>
                    <list list-type="bullet">
                      <list-item>
                        <p>Detect and correct typographical and grammatical errors</p>
                      </list-item>
                      <list-item>
                        <p>Standardize tone to formal academic style</p>
                      </list-item>
                      <list-item>
                        <p>Refine expressions for clarity and conciseness</p>
                      </list-item>
                      <list-item>
                        <p>Ensure logical consistency and readability</p>
                      </list-item>
                      <list-item>
                        <p>Strengthen paragraph coherence</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>Abstract summarization bot (single-shot output)</td>
                  <td>Generates structured summaries and condenses the case report into a format suitable for conference or journal abstract submission.</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Output specifications</p>
                      </list-item>
                    </list>
                    <list list-type="bullet">
                      <list-item>
                        <p>Generate a structured abstract text</p>
                      </list-item>
                      <list-item>
                        <p>Propose 2 candidate titles</p>
                      </list-item>
                      <list-item>
                        <p>Select 3 relevant keywords</p>
                      </list-item>
                      <list-item>
                        <p>Provide the final summarized text</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>AI: artificial intelligence.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Loop-Based Chatbots</title>
          <p>The 2 loop-based chatbots promote clinical reasoning through iterative, comment-based feedback:</p>
          <list list-type="bullet">
            <list-item>
              <p>Integration and interpretation bot: verifies clinical reasoning by checking the logical consistency between assessment results, the problem list, and goal setting. The bot prompts revisions until all logical checkpoints are met.</p>
            </list-item>
            <list-item>
              <p>Discussion bot: evaluates whether the argument aligns with the interpretation and logically supports the conclusion. The bot prompts revisions until all checkpoints are satisfied.</p>
            </list-item>
          </list>
        </sec>
        <sec>
          <title>Single-Shot Chatbots</title>
          <p>The 2 single-shot chatbots perform efficient, single-pass tasks:</p>
          <list list-type="bullet">
            <list-item>
              <p>Proofreading bot: corrects grammatical errors and improves clarity without altering the clinical meaning. It generates a polished draft in a single interaction.</p>
            </list-item>
            <list-item>
              <p>Abstract summarization bot: produces a concise summary of the completed case report in a format suitable for conference or journal submission.</p>
            </list-item>
          </list>
        </sec>
      </sec>
      <sec>
        <title>Step-By-Step Implementation</title>
        <sec>
          <title>Overview</title>
          <p>This guide enables educators to build the system by following step-by-step instructions and copying the provided resources; no complex coding is required. The following subsections outline the role of each component and the key actions involved. Detailed instructions, including specific platform operations, configuration values, and troubleshooting guidance, are provided in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
        </sec>
        <sec>
          <title>Prerequisites: Accounts and API Keys</title>
          <p>Ensure the following are ready before starting:</p>
          <list list-type="bullet">
            <list-item>
              <p>Dify account (cloud version or self-hosted)</p>
            </list-item>
            <list-item>
              <p>Slack workspace (educators need permission to create apps and add bots)</p>
            </list-item>
            <list-item>
              <p>Google account (to access Google Drive and Sheets)</p>
            </list-item>
            <list-item>
              <p>API keys: an API key from an LLM provider (eg, OpenAI API key or Anthropic API key; <xref ref-type="boxed-text" rid="box2">Textbox 2</xref>).</p>
            </list-item>
          </list>
          <boxed-text id="box2" position="float">
            <title>Understanding application programming interfaces (APIs) and API keys.</title>
            <list list-type="bullet">
              <list-item>
                <p>What is an API? An API is a set of rules that allows different software systems to communicate. It acts as a standardized bridge, sending a digital request from your system to the artificial intelligence (AI) service and returning the response. This allows your application to use powerful external AI capabilities without hosting the underlying technology locally.</p>
              </list-item>
              <list-item>
                <p>What is an API key? An API key is a unique string of characters that acts as a digital ID card (authentication token). When Dify sends a request to a large language model provider (such as OpenAI), it uses this key to verify the user’s identity and link use to a specific billing account. Warning: never share this key publicly. If compromised, unauthorized users may incur charges against your account.</p>
              </list-item>
            </list>
          </boxed-text>
        </sec>
        <sec>
          <title>Setting Up Dify</title>
          <p>Dify serves as the AI processing engine. Implementation involves creating a new Chatflow-type application, importing the feedback workflow via the domain-specific language file (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>), registering the LLM API key, and adjusting the meta-prompts to suit the target clinical domain. Once published, Dify generates an API key for use in subsequent integration steps.</p>
        </sec>
        <sec>
          <title>Creating the Slack Application</title>
          <p>After configuring Dify, the next step is to create the bot account in Slack. This involves registering a new app in the Slack API console, assigning the minimum necessary permissions (eg, reading messages, sending replies), and installing the bot in the target workspace. The resulting bot token is required for the integration step.</p>
        </sec>
        <sec>
          <title>Configuring GAS</title>
          <p>Dify handles the AI logic, and Slack provides the chat interface, but the 2 platforms cannot communicate directly. GAS serves as the bridge connecting them. Implementation involves creating a GAS project, deploying the relay script (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>), and securely storing the API credentials from the previous steps as script properties. The script is then deployed as a web application so that Slack can send messages to it.</p>
        </sec>
        <sec>
          <title>Final Configuration and Verification</title>
          <p>The final step links all 3 components and verifies system function. Configuring Slack’s event subscriptions feature to forward messages to the GAS end point completes the communication loop. A test message sent in Slack should trigger the full pipeline: Slack receives the message, GAS relays it to Dify, the LLM generates feedback, and the response returns to Slack while being logged in Google Sheets.</p>
        </sec>
      </sec>
      <sec>
        <title>Data Privacy</title>
        <p>Because this system transmits case report content through multiple external platforms, safeguarding protected health information (PHI) is essential. This section describes the data protection measures organized into 3 categories: administrative, technical, and supervisory safeguards.</p>
        <sec>
          <title>Administrative Safeguards</title>
          <p>Before submitting any draft to the system, novice staff must deidentify all patient information following the anonymization standards recommended by the International Committee of Medical Journal Editors [<xref ref-type="bibr" rid="ref15">15</xref>]. The deidentification protocol involves 2 steps:</p>
          <list list-type="order">
            <list-item>
              <p>Remove all direct identifiers: patient names, medical record numbers, dates of birth, addresses, and contact information.</p>
            </list-item>
            <list-item>
              <p>Generalize quasi-identifiers to prevent reidentification through combination: convert specific dates to relative timelines (eg, “Day 1 of admission” rather than a calendar date), express exact ages in decade ranges (eg, “a patient in their 80s”), and replace facility names with generic descriptors (eg, “a community rehabilitation hospital”).</p>
            </list-item>
          </list>
          <p>In the pilot implementation, we provided deidentification training to all participants prior to system use (refer to the Ethical Considerations section). Each novice staff member received individual instruction on the protocol, supplemented by a short instructional video demonstrating the 2-step process with concrete examples from rehabilitation case reports. We reinforced compliance through ongoing supervision during the pilot period.</p>
        </sec>
        <sec>
          <title>Technical Safeguards</title>
          <p>All communication with LLMs in this system occurs exclusively through the API, not through consumer-facing chat interfaces such as ChatGPT (OpenAI) or Claude.ai (Anthropic). This architectural choice provides a contractual safeguard: both OpenAI and Anthropic explicitly state in their API terms of service that data submitted through the API are not used to train or improve their models [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Both OpenAI and Anthropic retain API data for up to 30 days solely for abuse monitoring purposes, after which they are automatically deleted. Because data submitted to LLM providers cannot be recalled during this retention window, deidentification prior to submission constitutes the critical safeguard.</p>
          <p>To provide a transparent risk assessment, we trace the complete data path (<xref rid="figure4" ref-type="fig">Figure 4</xref>). When a novice staff member submits a message in Slack, the data traverse 5 external nodes before a response is returned:</p>
          <list list-type="order">
            <list-item>
              <p>Slack servers: Slack stores messages with encryption; access is restricted to invited channel members.</p>
            </list-item>
            <list-item>
              <p>GAS: GAS processes data transiently during relay without persistent storage.</p>
            </list-item>
            <list-item>
              <p>Google Sheets: conversation logs are persistently stored for educational analysis, with access restricted to designated administrators.</p>
            </list-item>
            <list-item>
              <p>Dify Cloud: conversation logs are retained within the platform and are accessible only to the system administrator.</p>
            </list-item>
            <list-item>
              <p>LLM API end point (OpenAI or Anthropic): the LLM provider processes data and retains it for up to 30 days under the nontraining policies described above.</p>
            </list-item>
          </list>
          <p>For institutions requiring full data sovereignty, Dify offers a self-hosted deployment option that retains all data within the institution’s own infrastructure, though this requires server infrastructure and technical expertise.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Dataflow and privacy safeguards across the 5 system nodes. API: application programming interface; LLM: large language model.</p>
            </caption>
            <graphic xlink:href="mededu_v12i1e76924_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Real-Time Oversight and Incident Response</title>
          <p>The system architecture supports real-time oversight. Because all interactions occur in shared Slack channels, educators can continuously monitor both novice staff submissions and AI responses, enabling immediate detection of any inadvertent PHI disclosure. The Google Sheets log provides a persistent, searchable record for periodic auditing. If PHI is inadvertently submitted, educators can take the following remediation steps:</p>
          <list list-type="bullet">
            <list-item>
              <p>Delete the PHI-containing message from Slack.</p>
            </list-item>
            <list-item>
              <p>Remove the corresponding row from the Google Sheets log.</p>
            </list-item>
            <list-item>
              <p>Purge the conversation log from the Dify platform.</p>
            </list-item>
            <list-item>
              <p>Rely on the LLM provider’s automatic deletion of the data within the 30-day retention window, because data already submitted to the provider cannot be recalled.</p>
            </list-item>
          </list>
          <p>The current system does not include automated PHI detection prior to submission; deidentification relies on the administrative safeguards described above. We identify the development of automated presubmission screening as a priority for future implementations (refer to the Limitations and Future Directions section).</p>
        </sec>
        <sec>
          <title>Transparency, Consent, and Scope of AI Feedback</title>
          <p>Transparency is foundational to ethical AI adoption. Before introducing the system, educators should clearly explain to novice staff that they are communicating with an AI system and how their data will be processed. Educators should also define the system as an educational support tool for facilitating the drafting process, rather than a replacement for human supervision or a formal assessment of clinical capabilities.</p>
          <p>To manage the risk of hallucinations, the system uses 2 strategies. First, the AI’s feedback includes a disclaimer: “AI can make mistakes. Always verify medical facts with your supervisor.” Second, the AI’s role is limited to structural and logical feedback rather than clinical diagnosis, reducing the risk of harmful errors.</p>
        </sec>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>The ethics committee of Kyoto Min-iren Asukai Hospital approved this pilot evaluation (2024-0502). All participating staff members received verbal and written explanations of the study’s purpose and data handling procedures, and provided written informed consent. We explained deidentification requirements to all novice staff members individually and reinforced them through an instructional video prior to system use. For past case reports used in meta-prompt tuning, we implemented an opt-out procedure. Participants received no financial compensation.</p>
      </sec>
      <sec>
        <title>Iterative Development Process</title>
        <p>The current Dify-based system evolved through iterative refinement of an earlier prototype. The initial version used a single-prompt chatbot approach. Early testing revealed 2 challenges: a ceiling effect in which most novice staff passed all checkpoints on their first submission, indicating that the meta-prompts were too lenient for meaningful learning, and declining instruction adherence as prompt length increased. These issues motivated the transition to the Dify-based Chatflow architecture, which evaluates checkpoints sequentially and allows educators to adjust passing criteria through its visual interface.</p>
        <p>Some instructors also expressed concern that overreliance on AI feedback could diminish clinical reasoning skills. We therefore designed the system to limit AI feedback to structural and logical aspects and to prompt learners to reconsider their own reasoning rather than providing corrected example text.</p>
      </sec>
      <sec>
        <title>Pilot Implementation</title>
        <p>To inform the design and iterative refinement of this tutorial, we conducted a single-center pilot implementation at Kyoto Min-iren Asukai Hospital. This pilot used a prototype version with direct Slack-GAS-AI integration prior to the introduction of Dify. Because the user interface (Slack) and the fundamental feedback logic (iterative revisions) remained identical, the usability data are directly applicable to the Dify-based system.</p>
        <p>Five novice rehabilitation staff members (3 physiotherapists and 2 occupational therapists) who joined in April 2024 and 5 educational instructors participated. The pilot ran from April to June 2024. Prior to this pilot, the facility had not used Slack for official communication; thus, this pilot represented the participants’ first experience with the platform. During the pilot, participants tagged the specific bot (eg, “@Integration_Bot”) in Slack to initiate iterative feedback on structure and logic. Once the content was finalized, they used the “@Proofreading_Bot” for grammatical corrections before submitting the final draft to their human supervisors.</p>
        <p>We collected data through 2 methods. First, postimplementation surveys via Google Forms assessed the system’s usability and acceptance. Novice staff completed the System Usability Scale [<xref ref-type="bibr" rid="ref18">18</xref>] and rated the appropriateness of the AI feedback content. The System Usability Scale is a standardized 10-item questionnaire for measuring system usability. Scores above 68 indicate above-average usability, and scores above 85 indicate excellent usability. Instructors assessed changes in instructional efficiency and feedback appropriateness. Second, we analyzed use logs from the Slack-linked spreadsheet, including use frequency, revision counts per task, and the content of feedback.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>This section describes the pilot implementation experience, which informed the iterative refinement and final design of this tutorial.</p>
      <p>The postimplementation survey response rate was 100% (5/5) for both instructors and novice staff. Detailed survey results are provided in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p>
      <p>Novice staff found the system accessible, with a median System Usability Scale score of 90 (range 70-95), confirming that the approach lowered the barrier to adoption. All 5 staff members reported that the AI feedback was helpful for their learning (median 5, range 4-5). Instructor feedback identified areas where the tutorial framework requires further customization: while 80% (4/5) of instructors anticipated a reduction in future instructional burden (median 4, range 1-5), ratings for the appropriateness of AI feedback content were moderate (median 3, range 1-4), suggesting that the balance between structural feedback and clinical depth needs institution-specific calibration.</p>
      <p>Log analysis confirmed that all 5 novice staff members actively used the system. Typically, they used the integration and interpretation bot 1 to 2 times and the proofreading bot once per report.</p>
      <p>Qualitative feedback from novice staff highlighted the psychological benefits of the system, with comments such as “My mental burden is reduced because I can get feedback before showing it to a human.” Instructors acknowledged efficiency gains, noting the ability to “focus on specialized feedback.” However, some instructors expressed concern that reliance on the system could lead to a decline in writing skills and clinical reasoning abilities.</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This tutorial presents a practical framework for building an LLM-based feedback system for case report writing in clinical education. The principal contribution is demonstrating that educators can construct a customized AI feedback system by combining 3 accessible tools (Dify, Slack, and GAS) while maintaining educational quality and data privacy.</p>
        <p>The system embodies 2 key design principles. First, comment-based iterative feedback encourages active revision rather than passive correction, preserving the cognitive effort essential for developing clinical reasoning skills [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Second, the human-in-the-loop principle limits AI to structural and logical evaluation, reserving clinical validity assessment for qualified educators and mitigating the risk of unwarranted clinical authority [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
        <p>The pilot implementation experience supported the design decisions underlying this tutorial. In particular, the transition from the prototype to the Dify-based architecture was directly motivated by 2 challenges observed during early testing: a ceiling effect indicating that initial meta-prompts were insufficiently stringent and declining instruction adherence as prompt complexity increased. These observations illustrate a core advantage of the framework presented here: educators can iteratively adjust passing criteria and feedback logic through Dify’s visual interface, enabling continuous adaptation without programming expertise.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>To our knowledge, few studies have provided practical, reproducible guidance for clinical educators to build customized LLM-based feedback systems. Systematic reviews of LLMs in medical education have predominantly identified studies evaluating LLM performance on examinations and clinical knowledge assessments, with very few reporting empirical implementation research [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. Practical programming-free AI development guides in health care have focused on other domains, such as image classification [<xref ref-type="bibr" rid="ref10">10</xref>], and exploratory studies in adjacent fields have examined similar accessible tools for providing formative feedback on student writing [<xref ref-type="bibr" rid="ref22">22</xref>]. A step-by-step guide for building an LLM-based formative feedback system for clinical writing education has not been described. This tutorial addresses that gap.</p>
        <p>The design principle of delegating structural and logical review to AI while reserving clinical judgment for educators reflects an emerging model in which AI supports, rather than replaces, expert judgment [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Prior studies on the use of AI in education have reported reductions in teachers’ workload and stress, along with improvements in instructional efficiency [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. The pilot findings were consistent: instructors reported the ability to “focus on specialized feedback” rather than routine text review. This division of labor may offer a scalable approach to feedback delivery in resource-constrained educational settings.</p>
        <p>Accessibility was a key design consideration. Prior research indicates that AI-based educational tools positively influence learning efficiency and cognitive motivation [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. The pilot results supported this, with high usability ratings achieved even among staff with no prior experience using the chat platform.</p>
        <p>This tutorial demonstrates that rubric-based LLM evaluation can be customized for domain-specific educational purposes without programming expertise. Although the potential of AI as a writing support tool is well documented [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>] and LLMs can reliably evaluate clinical writing against structured rubrics [<xref ref-type="bibr" rid="ref28">28</xref>], these capabilities have typically required programming expertise, limiting accessibility for clinical educators.</p>
        <p>Overreliance on AI feedback poses recognized risks, including cognitive deskilling and diminished independent reasoning [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. A recent scoping review of ethical challenges in AI-assisted medical education underscores the need for hybrid learning models that balance AI assistance with traditional teaching [<xref ref-type="bibr" rid="ref19">19</xref>]. This tutorial addresses these concerns through the human-in-the-loop principle: the system limits AI feedback to structural and logical aspects, and all AI-generated comments include disclaimers directing novice staff to verify content with their supervisors.</p>
      </sec>
      <sec>
        <title>Limitations and Future Directions</title>
        <p>This tutorial and its pilot evaluation have several limitations. First, the small sample size (5 novice staff and 5 instructors) limits causal inference. Second, this was a single-center pilot; future research should involve multicenter collaborative studies. Third, the outcomes relied on subjective questionnaires. Future studies should analyze quantitative data such as the duration of instructor guidance and use independent reviewers to evaluate report quality objectively. Fourth, although we provided deidentification training through individual instruction and an instructional video, the pilot did not include an automated presubmission PHI detection mechanism. Recent studies have demonstrated that LLM-based systems can analyze conversation data while preserving privacy [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>No incidents of PHI disclosure were identified during the pilot period, suggesting that the current approach, which aligns with standard security practices for cloud-based services, was sufficient within this controlled setting. However, future implementations should strengthen compliance through additional safeguards: supervisor-led presubmission review, prioritization of hypothetical cases during early adoption, and development of automated PHI detection systems. In contexts requiring stricter data governance, locally hosted LLMs may also be considered.</p>
        <p>Several broader considerations apply to the adoption of this approach. The system relies on cloud-based services, which may not meet the data sovereignty requirements of all institutions. Additionally, because LLM capabilities and API policies evolve rapidly, educators should monitor LLM provider updates regarding data handling practices and model performance. Furthermore, while this tutorial provides detailed implementation instructions and reproducible resources, the step-by-step guide has not yet been independently tested by educators outside the development team.</p>
        <p>Future directions include broader validation of the tutorial’s reproducibility across diverse clinical settings, development of automated PHI detection as a presubmission safeguard, and investigation of the system’s long-term impact on writing proficiency and clinical reasoning development.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This tutorial provides a reproducible guide for building a case report feedback system using Dify and Slack without programming expertise. The architecture enables educators to fine-tune AI logic through visual interfaces, separating AI reasoning from software code. The tutorial also addresses data privacy considerations for deploying AI systems that handle clinical educational content. By emphasizing human oversight at every stage and iterative refinement of feedback criteria, this framework supports educators in adapting the system to their institutional context and evolving educational needs.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Meta-prompts used in the system.</p>
        <media xlink:href="mededu_v12i1e76924_app1.docx" xlink:title="DOCX File, 44 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Step-by-step implementation guide.</p>
        <media xlink:href="mededu_v12i1e76924_app2.docx" xlink:title="DOCX File, 25 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Dify domain-specific language file (importable file for reproduction).</p>
        <media xlink:href="mededu_v12i1e76924_app3.zip" xlink:title="ZIP File (Zip Archive), 23 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Google Apps Script code.</p>
        <media xlink:href="mededu_v12i1e76924_app4.txt" xlink:title="TXT File, 7 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Detailed questionnaire results.</p>
        <media xlink:href="mededu_v12i1e76924_app5.docx" xlink:title="DOCX File, 29 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">GAS</term>
          <def>
            <p>Google Apps Script</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">PHI</term>
          <def>
            <p>protected health information</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">RW</term>
          <def>
            <p>reflective writing</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors thank the rehabilitation staff at Kyoto Min-iren Asukai Hospital for their assistance in this project. During the preparation of this manuscript, the authors used Claude Opus 4.6 (Anthropic [<xref ref-type="bibr" rid="ref17">17</xref>]) and Gemini 3.1 Pro (Google [<xref ref-type="bibr" rid="ref32">32</xref>]) for the following purposes: drafting and editing assistance, literature search and information gathering, structural planning and outline development, and English language refinement. The authors reviewed, verified, and edited all artificial intelligence–generated content and take full responsibility for the accuracy and integrity of the final manuscript.</p>
    </ack>
    <notes>
      <sec>
        <title>Funding</title>
        <p>The application programming interface use fee for the pilot implementation was supported by a research fund from the Scientific Research Works Peer Support Group awarded to YK. The costs for the latest system development and article processing charges were covered by a 2025 research grant from the Shinohara Foundation. The funders had no role in the project design, data collection and analysis, decision to publish, or preparation of the manuscript.</p>
      </sec>
    </notes>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data supporting the findings of this work, including the developed meta-prompts and codes, are available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendices 1</xref> and <xref ref-type="supplementary-material" rid="app3">3</xref>-<xref ref-type="supplementary-material" rid="app5">5</xref>. All other data are available upon request from the corresponding author.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>Conceptualization: YT, YK</p>
        <p>Funding acquisition: YT, YK</p>
        <p>Investigation: YT, SN, KM</p>
        <p>Methodology: YT, YK</p>
        <p>Project administration: YT</p>
        <p>Resources: YT, YK</p>
        <p>Supervision: YK</p>
        <p>Validation: YT, SN, KM</p>
        <p>Writing – original draft: YT</p>
        <p>Writing – review &#38; editing: YT, SN, KM, YK</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Artioli</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Deiana</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>De Vincenzo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Raucci</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Amaducci</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bassi</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Di Leo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hayter</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghirotto</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Health professionals and students' experiences of reflective writing in learning: a qualitative meta-synthesis</article-title>
          <source>BMC Med Educ</source>
          <year>2021</year>
          <month>07</month>
          <day>22</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>394</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmededuc.biomedcentral.com/articles/10.1186/s12909-021-02831-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12909-021-02831-4</pub-id>
          <pub-id pub-id-type="medline">34294058</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12909-021-02831-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC8299581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>So</surname>
              <given-names>WZ</given-names>
            </name>
            <name name-style="western">
              <surname>Tey</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>YX</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>YX</given-names>
            </name>
            <name name-style="western">
              <surname>Tay</surname>
              <given-names>RY</given-names>
            </name>
            <name name-style="western">
              <surname>Leong</surname>
              <given-names>IT</given-names>
            </name>
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Chiam</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Phua</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Murugam</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>EK</given-names>
            </name>
            <name name-style="western">
              <surname>Krishna</surname>
              <given-names>LK</given-names>
            </name>
          </person-group>
          <article-title>A systematic scoping review of reflective writing in medical education</article-title>
          <source>BMC Med Educ</source>
          <year>2023</year>
          <month>01</month>
          <day>09</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>12</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmededuc.biomedcentral.com/articles/10.1186/s12909-022-03924-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12909-022-03924-4</pub-id>
          <pub-id pub-id-type="medline">36624494</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12909-022-03924-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC9830881</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burgess</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>van Diggele</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mellis</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Feedback in the clinical setting</article-title>
          <source>BMC Med Educ</source>
          <year>2020</year>
          <month>12</month>
          <day>03</day>
          <volume>20</volume>
          <issue>Suppl 2</issue>
          <fpage>460</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmededuc.biomedcentral.com/articles/10.1186/s12909-020-02280-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12909-020-02280-5</pub-id>
          <pub-id pub-id-type="medline">33272265</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12909-020-02280-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC7712594</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>YS</given-names>
            </name>
            <name name-style="western">
              <surname>Gašević</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Can large language models provide feedback to students? A case study on ChatGPT</article-title>
          <source>Proceedings of the 2023 IEEE International Conference on Advanced Learning Technologies</source>
          <year>2023</year>
          <conf-name>ICALT 2023</conf-name>
          <conf-date>July 10-13, 2023</conf-date>
          <conf-loc>Orem, UT</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icalt58122.2023.00100</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>DY</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Vodrahalli</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>McFarland</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Can large language models provide useful feedback on research papers? A large-scale empirical analysis</article-title>
          <source>NEJM AI</source>
          <year>2024</year>
          <month>07</month>
          <day>25</day>
          <volume>1</volume>
          <issue>8</issue>
          <pub-id pub-id-type="doi">10.1056/AIoa2400196</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rossettini</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Palese</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pillastrini</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Turolla</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Pros and cons of using artificial intelligence chatbots for musculoskeletal rehabilitation management</article-title>
          <source>J Orthop Sports Phys Ther</source>
          <year>2023</year>
          <month>12</month>
          <volume>53</volume>
          <issue>12</issue>
          <fpage>728</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="doi">10.2519/jospt.2023.12000</pub-id>
          <pub-id pub-id-type="medline">37707390</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>YG</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lei</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>YD</given-names>
            </name>
          </person-group>
          <article-title>The application of large language models in medicine: a scoping review</article-title>
          <source>iScience</source>
          <year>2024</year>
          <month>04</month>
          <day>23</day>
          <volume>27</volume>
          <issue>5</issue>
          <fpage>109713</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2589-0042(24)00935-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.isci.2024.109713</pub-id>
          <pub-id pub-id-type="medline">38746668</pub-id>
          <pub-id pub-id-type="pii">S2589-0042(24)00935-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC11091685</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Heston</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Khun</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Prompt engineering in medical education</article-title>
          <source>Int Med Educ</source>
          <year>2023</year>
          <month>08</month>
          <day>31</day>
          <volume>2</volume>
          <issue>3</issue>
          <fpage>198</fpage>
          <lpage>205</lpage>
          <pub-id pub-id-type="doi">10.3390/ime2030019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zaghir</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Naguib</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bjelogrlic</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Névéol</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tannier</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lovis</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Prompt engineering paradigms for medical applications: scoping review</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>09</month>
          <day>10</day>
          <volume>26</volume>
          <fpage>e60501</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024/1/e60501/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/60501</pub-id>
          <pub-id pub-id-type="medline">39255030</pub-id>
          <pub-id pub-id-type="pii">v26i1e60501</pub-id>
          <pub-id pub-id-type="pmcid">PMC11422740</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hoseini</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Dewar</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Empowering healthcare professionals with no-code artificial intelligence platforms for model development, a practical demonstration for pathology</article-title>
          <source>Discoveries (Craiova)</source>
          <year>2024</year>
          <month>03</month>
          <day>30</day>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>e182</fpage>
          <pub-id pub-id-type="doi">10.15190/d.2024.1</pub-id>
          <pub-id pub-id-type="medline">39734805</pub-id>
          <pub-id pub-id-type="pii">296</pub-id>
          <pub-id pub-id-type="pmcid">PMC11682784</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="web">
          <source>Dify</source>
          <access-date>2026-06-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dify.ai/">https://dify.ai/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="web">
          <source>Slack</source>
          <access-date>2026-06-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://slack.com/">https://slack.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Biber</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nekrasova</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Horn</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The effectiveness of feedback for L1-English and L2-writing development: a meta-analysis</article-title>
          <source>ETS Res Rep Ser</source>
          <year>2014</year>
          <month>08</month>
          <day>08</day>
          <volume>2011</volume>
          <issue>1</issue>
          <fpage>i</fpage>
          <lpage>99</lpage>
          <pub-id pub-id-type="doi">10.1002/j.2333-8504.2011.tb02241.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lipnevich</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Mattern</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Feddock</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Formative assessment and feedback in medical education: a practical guide: AMEE guide no. 189</article-title>
          <source>Med Teach</source>
          <year>2025</year>
          <month>10</month>
          <day>24</day>
          <volume>48</volume>
          <issue>6</issue>
          <fpage>921</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1080/0142159x.2025.2569623</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="web">
          <source>International Committee of Medical Journal Editors</source>
          <access-date>2026-06-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.ICMJE.org">http://www.ICMJE.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
          <article-title>Data controls in the OpenAI platform</article-title>
          <source>OpenAI</source>
          <access-date>2026-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://platform.openai.com/docs/guides/your-data">https://platform.openai.com/docs/guides/your-data</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <article-title>Is my data used for model training?</article-title>
          <source>Anthropic</source>
          <access-date>2026-05-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://privacy.claude.com/en/articles/7996868-is-my-data-used-for-model-training">https://privacy.claude.com/en/articles/7996868-is-my-data-used-for-model-training</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brooke</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>SUS: a 'quick and dirty' usability scale</article-title>
          <source>Usability Evaluation in Industry</source>
          <year>1996</year>
          <publisher-loc>Boca Raton, FL</publisher-loc>
          <publisher-name>CRC Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The ethical challenges in the integration of artificial intelligence and large language models in medical education: a scoping review</article-title>
          <source>PLoS One</source>
          <year>2025</year>
          <month>10</month>
          <day>22</day>
          <volume>20</volume>
          <issue>10</issue>
          <fpage>e0333411</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0333411"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0333411</pub-id>
          <pub-id pub-id-type="medline">41124146</pub-id>
          <pub-id pub-id-type="pii">PONE-D-25-17270</pub-id>
          <pub-id pub-id-type="pmcid">PMC12543126</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lucas</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Upperman</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of large language models and their implications in medical education</article-title>
          <source>Med Educ</source>
          <year>2024</year>
          <month>11</month>
          <volume>58</volume>
          <issue>11</issue>
          <fpage>1276</fpage>
          <lpage>85</lpage>
          <pub-id pub-id-type="doi">10.1111/medu.15402</pub-id>
          <pub-id pub-id-type="medline">38639098</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aster</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Laupichler</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Rockwell-Kollmann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Masala</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bala</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Raupach</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT and other large language models in medical education - scoping literature review</article-title>
          <source>Med Sci Educ</source>
          <year>2024</year>
          <month>11</month>
          <day>13</day>
          <volume>35</volume>
          <issue>1</issue>
          <fpage>555</fpage>
          <lpage>67</lpage>
          <pub-id pub-id-type="doi">10.1007/s40670-024-02206-6</pub-id>
          <pub-id pub-id-type="medline">40144083</pub-id>
          <pub-id pub-id-type="pii">2206</pub-id>
          <pub-id pub-id-type="pmcid">PMC11933646</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Venter</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Coetzee</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Schmulian</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Exploring the use of artificial intelligence (AI) in the delivery of effective feedback</article-title>
          <source>Assess Eval High Educ</source>
          <year>2024</year>
          <month>10</month>
          <day>20</day>
          <volume>50</volume>
          <issue>4</issue>
          <fpage>516</fpage>
          <lpage>36</lpage>
          <pub-id pub-id-type="doi">10.1080/02602938.2024.2415649</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Younas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Subramanian</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Haziazi</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Hussainy</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Kindi</surname>
              <given-names>AN</given-names>
            </name>
          </person-group>
          <article-title>A review on implementation of artificial intelligence in education</article-title>
          <source>Int J Res Innov Soc Sci</source>
          <year>2023</year>
          <month>09</month>
          <day>14</day>
          <volume>VII</volume>
          <issue>VIII</issue>
          <fpage>1092</fpage>
          <lpage>100</lpage>
          <pub-id pub-id-type="doi">10.47772/IJRISS.2023.7886</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kasneci</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sessler</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Küchemann</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bannert</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dementieva</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fischer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Gasser</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Groh</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Günnemann</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hüllermeier</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Krusche</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kutyniok</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Michaeli</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nerdel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pfeffer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Poquet</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Sailer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Seidel</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Stadler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weller</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kasneci</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT for good? On opportunities and challenges of large language models for education</article-title>
          <source>Learn Individ Differ</source>
          <year>2023</year>
          <month>04</month>
          <volume>103</volume>
          <fpage>102274</fpage>
          <pub-id pub-id-type="doi">10.1016/j.lindif.2023.102274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schiller</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liebenow</surname>
              <given-names>LW</given-names>
            </name>
            <name name-style="western">
              <surname>Steinbach</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Horbach</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fleckenstein</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using LLMs to bring evidence-based feedback into the classroom: AI-generated feedback increases secondary students’ text revision, motivation, and positive emotions</article-title>
          <source>Comput Educ Artif Intell</source>
          <year>2024</year>
          <month>06</month>
          <volume>6</volume>
          <fpage>100199</fpage>
          <pub-id pub-id-type="doi">10.1016/j.caeai.2023.100199</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>WL</given-names>
            </name>
            <name name-style="western">
              <surname>Koussayer</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sujka</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT: friend or foe in medical writing? An example of how ChatGPT can be utilized in writing case reports</article-title>
          <source>Surg Pract Sci</source>
          <year>2023</year>
          <month>06</month>
          <day>02</day>
          <volume>14</volume>
          <fpage>100185</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2666-2620(23)00031-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.sipas.2023.100185</pub-id>
          <pub-id pub-id-type="medline">39845855</pub-id>
          <pub-id pub-id-type="pii">S2666-2620(23)00031-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC11749974</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abd-Alrazaq</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>AlSaad</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Alhuwail</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Healy</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Latifi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aziz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Damseh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Alabed Alrazak</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Large language models in medical education: opportunities, challenges, and future directions</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <month>06</month>
          <day>01</day>
          <volume>9</volume>
          <fpage>e48291</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e48291/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48291</pub-id>
          <pub-id pub-id-type="medline">37261894</pub-id>
          <pub-id pub-id-type="pii">v9i1e48291</pub-id>
          <pub-id pub-id-type="pmcid">PMC10273039</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>HB</given-names>
            </name>
            <name name-style="western">
              <surname>Hoang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lopreiato</surname>
              <given-names>JO</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hemmer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Montgomery</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gagarin</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Assessing the ability of a large language model to score free-text medical student clinical notes: quantitative study</article-title>
          <source>JMIR Med Educ</source>
          <year>2024</year>
          <month>07</month>
          <day>25</day>
          <volume>10</volume>
          <fpage>e56342</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e56342/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/56342</pub-id>
          <pub-id pub-id-type="medline">39118469</pub-id>
          <pub-id pub-id-type="pii">v10i1e56342</pub-id>
          <pub-id pub-id-type="pmcid">PMC11327632</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choudhury</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhry</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Large language models and user trust: consequence of self-referential learning loop and the deskilling of health care professionals</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>04</month>
          <day>25</day>
          <volume>26</volume>
          <fpage>e56764</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024/1/e56764/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/56764</pub-id>
          <pub-id pub-id-type="medline">38662419</pub-id>
          <pub-id pub-id-type="pii">v26i1e56764</pub-id>
          <pub-id pub-id-type="pmcid">PMC11082730</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Izquierdo-Condoy</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Arias-Intriago</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tello-De-la-Torre</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Busch</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ortiz-Prado</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Generative artificial intelligence in medical education: enhancing critical thinking or undermining cognitive autonomy?</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>11</month>
          <day>03</day>
          <volume>27</volume>
          <fpage>e76340</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025/1/e76340/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/76340</pub-id>
          <pub-id pub-id-type="medline">41183320</pub-id>
          <pub-id pub-id-type="pii">v27i1e76340</pub-id>
          <pub-id pub-id-type="pmcid">PMC12624298</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tamkin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McCain</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Handa</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Durmus</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lovitt</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rathi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mountfield</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ritchie</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stern</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sumers</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Mueller</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>McEachen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Carter</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kaplan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ganguli</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Clio: privacy-preserving insights into real-world AI use</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on December 18, 2024</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2412.13678</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <source>Google Gemini</source>
          <access-date>2026-06-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://gemini.google.com">https://gemini.google.com</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
