<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JME</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Educ</journal-id>
      <journal-title>JMIR Medical Education</journal-title>
      <issn pub-type="epub">2369-3762</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v11i1e62779</article-id>
      <article-id pub-id-type="pmid">40053752</article-id>
      <article-id pub-id-type="doi">10.2196/62779</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Detecting Artificial Intelligence–Generated Versus Human-Written Medical Student Essays: Semirandomized Controlled Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lesselroth</surname>
            <given-names>Blake</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Bach</surname>
            <given-names>Carme</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhu</surname>
            <given-names>Lingxuan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Corizzo</surname>
            <given-names>Roberto</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Doru</surname>
            <given-names>Berin</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>University Hospital of Paediatrics and Adolescent Medicine, St. Josef-Hospital</institution>
            <institution>Ruhr University Bochum</institution>
            <addr-line>Alexandrinenstraße 5</addr-line>
            <addr-line>Bochum, 44791</addr-line>
            <country>Germany</country>
            <phone>49 234 509 2611</phone>
            <email>Berin.Doru@rub.de</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0008-1067-7468</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Maier</surname>
            <given-names>Christoph</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1212-744X</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Busse</surname>
            <given-names>Johanna Sophie</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0007-1923-3575</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Lücke</surname>
            <given-names>Thomas</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6875-6582</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Schönhoff</surname>
            <given-names>Judith</given-names>
          </name>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0007-5656-4816</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Enax- Krumova</surname>
            <given-names>Elena</given-names>
          </name>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6162-9414</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Hessler</surname>
            <given-names>Steffen</given-names>
          </name>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-0225-6169</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Berger</surname>
            <given-names>Maria</given-names>
          </name>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0008-6191-9623</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Tokic</surname>
            <given-names>Marianne</given-names>
          </name>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9789-575X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>University Hospital of Paediatrics and Adolescent Medicine, St. Josef-Hospital</institution>
        <institution>Ruhr University Bochum</institution>
        <addr-line>Bochum</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Departement of German Philology, General and Comparative Literary Studies</institution>
        <institution>Ruhr University Bochum</institution>
        <addr-line>Bochum</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Neurology, BG University Hospital Bergmannsheil gGmbH Bochum</institution>
        <institution>Ruhr University Bochum</institution>
        <addr-line>Bochum</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>German Department, German Linguistics</institution>
        <institution>Ruhr University Bochum</institution>
        <addr-line>Bochum</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>German Department, Digital Forensic Linguistics</institution>
        <institution>Ruhr University Bochum</institution>
        <addr-line>Bochum</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department for Medical Informatics, Biometry and Epidemiology</institution>
        <institution>Ruhr University Bochum</institution>
        <addr-line>Bochum</addr-line>
        <country>Germany</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Berin Doru <email>Berin.Doru@rub.de</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>3</day>
        <month>3</month>
        <year>2025</year>
      </pub-date>
      <volume>11</volume>
      <elocation-id>e62779</elocation-id>
      <history>
        <date date-type="received">
          <day>31</day>
          <month>5</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>12</day>
          <month>8</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>28</day>
          <month>11</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>16</day>
          <month>1</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Berin Doru, Christoph Maier, Johanna Sophie Busse, Thomas Lücke, Judith Schönhoff, Elena Enax- Krumova, Steffen Hessler, Maria Berger, Marianne Tokic. Originally published in JMIR Medical Education (https://mededu.jmir.org), 03.03.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Education, is properly cited. The complete bibliographic information, a link to the original publication on https://mededu.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://mededu.jmir.org/2025/1/e62779" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Large language models, exemplified by ChatGPT, have reached a level of sophistication that makes distinguishing between human- and artificial intelligence (AI)–generated texts increasingly challenging. This has raised concerns in academia, particularly in medicine, where the accuracy and authenticity of written work are paramount.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This semirandomized controlled study aims to examine the ability of 2 blinded expert groups with different levels of content familiarity—medical professionals and humanities scholars with expertise in textual analysis—to distinguish between longer scientific texts in German written by medical students and those generated by ChatGPT. Additionally, the study sought to analyze the reasoning behind their identification choices, particularly the role of content familiarity and linguistic features.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Between May and August 2023, a total of 35 experts (medical: n=22; humanities: n=13) were each presented with 2 pairs of texts on different medical topics. Each pair had similar content and structure: 1 text was written by a medical student, and the other was generated by ChatGPT (version 3.5, March 2023). Experts were asked to identify the AI-generated text and justify their choice. These justifications were analyzed through a multistage, interdisciplinary qualitative analysis to identify relevant textual features. Before unblinding, experts rated each text on 6 characteristics: linguistic fluency and spelling/grammatical accuracy, scientific quality, logical coherence, expression of knowledge limitations, formulation of future research questions, and citation quality. Univariate tests and multivariate logistic regression analyses were used to examine associations between participants’ characteristics, their stated reasons for author identification, and the likelihood of correctly determining a text’s authorship.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Overall, in 48 out of 69 (70%) decision rounds, participants accurately identified the AI-generated texts, with minimal difference between groups (medical: 31/43, 72%; humanities: 17/26, 65%; odds ratio [OR] 1.37, 95% CI 0.5-3.9). While content errors had little impact on identification accuracy, stylistic features—particularly redundancy (OR 6.90, 95% CI 1.01-47.1), repetition (OR 8.05, 95% CI 1.25-51.7), and thread/coherence (OR 6.62, 95% CI 1.25-35.2)—played a crucial role in participants’ decisions to identify a text as AI-generated.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The findings suggest that both medical and humanities experts were able to identify ChatGPT-generated texts in medical contexts, with their decisions largely based on linguistic attributes. The accuracy of identification appears to be independent of experts’ familiarity with the text content. As the decision-making process primarily relies on linguistic attributes—such as stylistic features and text coherence—further quasi-experimental studies using texts from other academic disciplines should be conducted to determine whether instructions based on these features can enhance lecturers’ ability to distinguish between student-authored and AI-generated work.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>artificial intelligence</kwd>
        <kwd>ChatGPT</kwd>
        <kwd>large language models</kwd>
        <kwd>textual analysis</kwd>
        <kwd>writing style</kwd>
        <kwd>AI</kwd>
        <kwd>chatbot</kwd>
        <kwd>LLMs</kwd>
        <kwd>detection</kwd>
        <kwd>authorship</kwd>
        <kwd>medical student</kwd>
        <kwd>textual analysis</kwd>
        <kwd>linguistic quality</kwd>
        <kwd>decision-making</kwd>
        <kwd>logical coherence</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The rapid development of artificial intelligence (AI) and the emergence of large language models (LLMs), such as ChatGPT, have increasingly blurred the lines between human-written and AI-generated text. This has created a significant challenge in identifying the authorship of written work, especially as the use of AI has become ubiquitous since chatbots have become freely available [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Consequently, critical concerns have arisen in the educational and academic sectors, where the reliability and authenticity of written work are fundamental.</p>
      <p>According to a recent nationwide survey, nearly two-thirds of the German students reported using AI-based tools for their studies, with ChatGPT being the most commonly used chatbot [<xref ref-type="bibr" rid="ref3">3</xref>]. ChatGPT, developed by OpenAI, an American AI research laboratory, is a state-of-the-art AI chatbot capable of assisting users with a wide range of tasks, from text generation to problem-solving [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Its capabilities have opened up significant opportunities for educational and academic contexts. For example, AI-based tools like ChatGPT can support tasks such as text analysis, translation, and proofreading for research purposes [<xref ref-type="bibr" rid="ref6">6</xref>]. They also can provide support to students by enhancing their understanding of scientific methods, improving and refining written work, and assisting with examination preparation [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      <p>However, the widespread use of such tools raises concerns about their impact on students’ development of critical and independent thinking skills [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. In addition, it is possible that ChatGPT could provide incomplete or inaccurate information, potentially leading to misunderstandings of academic concepts and topics [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Further concerns arise from the potential for academic dishonesty and plagiarism, particularly in the context of written assignments and academic essays [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      <p>The lack of clarity on how to handle such cases is putting universities in a quandary, leading to the first court cases and, more recently, to the University of Munich being vindicated in its decision to reject such written work [<xref ref-type="bibr" rid="ref13">13</xref>]. In this case, an essay submitted as part of a Master’s application was rejected because it was “too well written,” raising suspicions that the text was likely generated by an AI tool such as ChatGPT [<xref ref-type="bibr" rid="ref13">13</xref>]. This case highlights that AI-generated texts are often characterized by their seemingly perfected style of formulation that refers to the linguistic level [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>], a characteristic that is known to be particularly pronounced and even more nuanced in English output texts compared with other languages such as German [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref18">18</xref>].</p>
      <p>The relevance of the problem for medical studies is not obvious at first glance because medical students generally do not have to write long scientific texts on a regular basis during their studies, but usually only for their doctoral thesis. However, the increasing use of AI tools such as ChatGPT also poses challenges in the medical field, where assessments rely not only on linguistic quality but also on content accuracy. The potential misattribution of authorship in medical texts—such as research articles, patient information, or promotional materials—has particularly serious implications, as errors or inaccuracies in these contexts can have grave consequences. It can be assumed that medical texts do not fall as much within the scope of ChatGPT and are therefore more difficult to reproduce accurately, especially because AI authors have no “moral scruples” about concealing ignorance and replacing verified sources with falsified ones [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref22">22</xref>]. However, a few studies have addressed the problem of AI-generated content on medical texts [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref26">26</xref>], reporting that ChatGPT has, at times, managed to mislead medical professionals [<xref ref-type="bibr" rid="ref26">26</xref>], which may suggest that familiarity with content plays a minor role in authorship identification.</p>
      <p>Existing research on LLM-based text generators such as ChatGPT frequently focuses on their role in assisting the writing process rather than evaluating the quality and detectability of longer scientific texts [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]. In addition, studies often investigate the detection of texts written by chatbots using automatic tools or even detectors specifically designed for this purpose [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref30">30</xref>]. The detection rate of these detectors is often higher than that of human reviewers, but the accuracy can vary greatly depending on the text genre and the classifier used [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. Moreover, linguistic features appear to be the most important subset of features influencing the performance of feature-based classifiers [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. In the academic domain, educators still face the challenge of qualitatively assessing the authenticity of student texts, often without the aid of automated detection tools.</p>
      <p>It is therefore of particular interest to determine how well human readers from the academic field can detect differences when directly comparing 2 texts on the same topic—an original student text and an AI-generated text—and which features stand out as particularly conspicuous and decisive for them. To better distinguish between the relevance of content-related and text-analytical attributes, we assembled a group of language experts from the humanities field alongside a group of medical experts specializing in pediatrics and neurology. Another key novelty and prerequisite of our study is the use of fully reproduced, longer scientific texts on medical topics written in German by medical students.</p>
      <p>Therefore, we conducted a study to determine whether medical experts and humanities lecturers could distinguish between texts written by medical students and those generated by ChatGPT (specifically ChatGPT version 3.5, March 23). Unlike the interactive “Turing Test” [<xref ref-type="bibr" rid="ref32">32</xref>], this task was not performed through a dialogue with a machine but rather through an internal, personal evaluation of 2 texts. We hypothesize that, in line with the Turing prophecy [<xref ref-type="bibr" rid="ref32">32</xref>], the correct identification rate for AI-generated texts within a German medical sample is approximately 70%, with content familiarity playing a secondary role, while formal and linguistic features exert a greater influence.</p>
      <p>Through a prospective analysis of longer German-language scientific texts written by students in the specialized health-related field of medicine, this study aims to provide new insights into AI-generated texts and the influence of content familiarity and linguistic expertise. The findings are intended to inform the development of guidelines to help lecturers (and others) recognize AI-generated texts, even in the absence of a comparable “original” text, and to contribute to future projects addressing the challenges posed by AI tools in academia.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Recruitment Process</title>
        <p>This semirandomized controlled trial was conducted between May and August 2023 at the University Hospital of Pediatrics and Adolescent Medicine, St. Josef-Hospital, Ruhr University Bochum (RUB), Germany. To recruit participants, an open call was issued to the Department of Pediatrics and Adolescent Medicine and the Department of Neurology at the University Hospital Bergmannsheil (both RUB). Senior physicians and members of scientific working groups were invited to participate, ensuring the involvement of clinical experts familiar with the content of the texts. Participation was voluntary, with clinical employment or medical expertise serving as key inclusion criteria, along with an interest in scientific texts. In the next phase of recruitment, a call was made to the Faculty of Humanities at Ruhr University to include participants with experience in text reception and analysis, with teaching experience as an additional inclusion criterion.</p>
      </sec>
      <sec>
        <title>Design</title>
        <p>Each participant received 2 pairs of texts, totaling 4 printed texts. Each pair consisted of 1 of 18 available term papers written by a medical student and a corresponding text generated by ChatGPT (version 3.5, March 2023), with the order of presentation randomized. The medical experts received 1 pair of texts on a topic closely related to their specialty and another pair on a less familiar topic. For example, a pediatrician received the text “Autoantibodies in Diabetes Mellitus,” while a neurologist received “Measurement of Aδ and C Fibers in Electrophysiology.” The second pair of texts covered a topic less directly related to their field of expertise.</p>
        <p>Given the exploratory nature of the study, it became increasingly evident—only after completing the experimental phase with the medical experts—that the extent to which content familiarity influences the identification process needed further examination, particularly in comparison to formal and linguistic aspects.</p>
        <p>As a result, a second phase of the study was initiated, involving a new group of experts with greater expertise in formal and linguistic analyses. This allowed for a comparison of results and evaluations across groups. In this group of humanities experts, each participant received the same 2 pairs of texts to ensure better comparability and verification of subject unfamiliarity. The first pair addressed a more general topic also familiar to nonmedical fields: “Iodine Deficiency.” The second pair analyzed a more specialized medical topic: “Autoantibodies in Diabetes Mellitus.”</p>
        <p>Participants were asked to read a pair of texts and, based on their personal experience with student-written texts, decide within a week—without extensive research—which of the 2 they believed was generated by ChatGPT. To ensure the blinding of both interviewers and participants, the headers of the texts contained only a randomly generated 3-digit number and a “chatbot or student” checkbox. Before the subsequent interview, participants documented their decision by ticking the corresponding box for their chosen text version. They were also instructed not to discuss the task or the texts with one another.</p>
        <p>About 1-2 weeks after the texts were distributed, participants were invited to a semistructured interview—conducted in person, by telephone, or via Zoom (Zoom Communications/Qumu Corporation)—to discuss their decisions, reasoning, and evaluations of the texts. Unblinding occurred after the interviews.</p>
      </sec>
      <sec>
        <title>Creation of the ChatGPT-Generated Versions</title>
        <p>Eighteen German-language medical essays served as templates for the ChatGPT-generated texts. These essays were written by doctoral students from the University Pediatric Clinic and the Clinic for Neurology at Bergmannsheil University Hospital, RUB, Germany. They originated from the Doctoral Colloquium pool at the University Hospital of Pediatrics and Adolescent Medicine in Bochum. As part of the colloquium, each doctoral student is encouraged to write a scientific essay thematically related to their announced dissertation topic. To provide an initial experience with scientific research and writing—and to give the reviewing study coordinator a first impression of their academic level and skills—students do not receive specific instructions. For this study, all available German texts from this pool that were written before the general introduction of ChatGPT were considered, provided their authors consented to their use.</p>
        <p>We used ChatGPT version 3.5, March 14 to replicate the texts. To generate a version with the same title and outline as the original papers while avoiding text breaks, 2 separate prompts were required to produce a continuous text from the introduction to the conclusion (<xref ref-type="table" rid="table1">Table 1</xref>).</p>
        <p>For the main part, depending on the type of original paper, several commands were necessary. For example, see <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <p>We then merged the individual sections to create a complete term paper, supplementing it with a bibliography that listed the sources provided by ChatGPT in sequential order. To ensure consistency, we harmonized the formatting of both ChatGPT-generated and student-written texts as much as possible, using the Arial font (size 11 for body text and size 12 for headings) with justified alignment. Sections or sentences specific to a student’s individual dissertation project were removed to maintain general applicability. However, we did not alter the choice of words, sentence structure, punctuation, spelling, or citation style.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Prompts used to create ChatGPT text.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>German (original prompt)</td>
                <td>English (translation)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>“Schreibe bitte einen Abschnitt über das Thema [TITEL DES TEILTHEMAS] der [wissenschaftlichen/medizinischen] Hausarbeit [TITEL DER HAUSARBEIT].”</p>
                    </list-item>
                    <list-item>
                      <p>“Belege Deine Aussagen mit Quellen, die bei Pubmed auffindbar sind.”</p>
                    </list-item>
                  </list>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>“Please write a section on the topic [NAME OF SUBTOPIC] of the [scientific/medical] term paper [NAME OF TERM PAPER].”</p>
                    </list-item>
                    <list-item>
                      <p>“Support your statements with sources that can be found on PubMed.”</p>
                    </list-item>
                  </list>
                </td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Additional instructions used to create ChatGPT text.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>German (original prompt)</td>
                <td>English (translation)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>“Schreibe einen Abschnitt zum Thema ‘Potenziell reversible Pathomechanismen als mögliche Ursachen von Hyposmie oder Anosmie bei Kindern’ der wissenschaftlichen Hausarbeit ‘Ursachen und Diagnostik von Riechstörungen bei Kindern und Jugendlichen’, der an den vorherigen Abschnitt anknüpft.”</td>
                <td>“Write a section on the topic ‘Potentially reversible pathomechanism as possible causes of hyposmia or anosmia in children’ of the scientific paper ‘Causes and diagnostics of olfactory dysfunction in children and adolescents’, which ties in with the previous section.”</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Data Assessment During the Interview</title>
        <p>The medical expert group was interviewed by 2 blinded interviewers (BD and JSB), while the humanities expert group was interviewed by a partially blinded interviewer (CM). Initially, participants provided demographic information, including age, experience in academic and student teaching, academic qualifications, publication history, and prior experience with ChatGPT. They were then asked to assess how well the following questions were addressed in each text, using the German grading system from 1 (very good) to 6 (unsatisfactory) (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for details). How would you rate (1) linguistic fluency, (2) scientific quality (eg, are the re-definitions scientifically derived and are studies cited that lead to certain conclusions?), (3) internal logic, (4) description of the limitations of current knowledge, (5) future research questions, and (6) citations and references of the text? Participants were then asked to identify which text version, using the corresponding 3-digit number, they had categorized as being generated by ChatGPT and to list the key reasons for their decision, which the interviewer recorded using keywords. Next, they rated their confidence in their decision on a scale from 1 (very confident) to 6 (not confident at all). After this initial assessment, participants were unblinded and informed which text had been written by a student and which by ChatGPT. In cases of misidentification, they were asked about their suspected reasons, which the interviewer also documented using keywords.</p>
      </sec>
      <sec>
        <title>Construction of Categories</title>
        <p>Beyond the identification rate and the text evaluations by each group, a qualitative analysis of participants’ statements regarding their reasoning for assigning authorship proved essential. This deeper analysis aimed to examine the influence of content-related versus formal-linguistic aspects and to better attribute global features to either student or chatbot authorship. For this purpose, the free-text responses (recorded by interviewers using keywords) were first thematically clustered based on the terms mentioned (see sample statements in the <italic>Free-Text Analysis</italic> section). Subsequently, through multiturn discussions between medical and linguistic experts, these thematic clusters were refined into distinct, nonoverlapping categories that encompassed all interviewee statements while reducing redundancy and multiple classifications.</p>
        <p>Many of these categories align with standard text-analytical frameworks, which typically cover a broad range of attributes, including morphology, syntax, style, structure, coherence and cohesion, content quality, form, and even sociolinguistic aspects [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref35">35</xref>]. However, the categories derived in this study are directly based on the text types used in the experiments. As a result, they provide a more precise representation of the emerging and still undefined text type “AI-generated” and are therefore preferable (see <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> for an overview of the categories).</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>Data were analyzed using Microsoft Excel, SPSS version 29.3 (IBM Corp.), and R-4.1.2 (R Foundation). Descriptive statistics are presented as numbers (n) and percentages or as means (SD), where appropriate. Univariate odds ratios and 95% CIs from the Fisher exact test were used to examine the association between demographic markers, participants’ field (medicine or humanities), and their expertise with the likelihood of correctly identifying a text’s source. The relationship between interview scores and response accuracy was assessed using the 2-sided Wilcoxon signed rank test for paired values. Additionally, correlations among all 5 responses were tested using a Friedman 2-way analysis of variance for ranks with Bonferroni correction.</p>
        <p>To analyze how participants attempted to identify the machine-generated text, we modeled the association of the derived categories (items) from the interviews based on their likelihood of being mentioned in the context of a chatbot-generated text. For each participant and interview, we recorded whether an item was cited in reference to a perceived chatbot text or a perceived student text. This association was analyzed using repeated-measures logistic regression, incorporating a random participant and sequence effect. The model was further adjusted for age group, the expert group (medical vs humanities), and prior experience with ChatGPT (binary).</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>An application for the study project was submitted to the Ethics Committee of the Medical Faculty at RUB (reference number 23-7837; April 2023). As the study did not involve direct research on human participants or patient data, the committee informed us that ethical approval was not required.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Interviewee Sample</title>
        <p>The biographical data of the 22 participating physicians (14 pediatricians, 3 nutritionists, 4 neurologists, and 1 neuroscientist) and 13 humanities scholars (8 literary scholars, 3 Germanists or linguists, 1 classical philologist, and 1 Romance philologist) are presented in <xref ref-type="table" rid="table3">Table 3</xref>.</p>
        <p>As there were more participating experts than available term papers, 3 pairs of texts were each assessed by 3 or 4 medical experts.</p>
        <p>At the time of the survey, only one-fifth of the participants reported having prior experience with ChatGPT. As the number of participating experts exceeded the number of available term papers, 3 pairs of texts were each assessed by 3 or 4 medical experts.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Interviewee sample.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="320"/>
            <col width="220"/>
            <col width="220"/>
            <col width="210"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Characteristics</td>
                <td>All participants (N=35)</td>
                <td>Medical experts (n=22)</td>
                <td>Humanities experts (n=13)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Age (years), n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&lt;40</td>
                <td>17 (49)</td>
                <td>13 (59)</td>
                <td>4 (31)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥40</td>
                <td>18 (51)</td>
                <td>9 (41)</td>
                <td>9 (69)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Experience in academic teaching<sup>a</sup> (years), n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>None</td>
                <td>2 (6)</td>
                <td>2 (9)</td>
                <td>N/A<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&lt;5</td>
                <td>8 (23)</td>
                <td>8 (36)</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥5</td>
                <td>25 (71)</td>
                <td>12 (55)</td>
                <td>13 (100)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>PhD/professorship, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>28 (80)</td>
                <td>18 (82)</td>
                <td>10 (77)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Authorship in a publication, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>32 (91)</td>
                <td>20 (91)</td>
                <td>12 (92)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Experience with ChatGPT<sup>a</sup>, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td>7 (20)</td>
                <td>2 (9)</td>
                <td>5 (38)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Only a little</td>
                <td>7 (20)</td>
                <td>4 (18)</td>
                <td>3 (23)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td>21 (60)</td>
                <td>16 (73)</td>
                <td>5 (38)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Self-assessed.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Detection Rate</title>
        <p>With 35 participants evaluating 2 text pairs each—excluding 1 misaligned and omitted case—a total of 69 decision rounds were conducted. In 48 out of 69 (70%) decision rounds, participants correctly identified the authorship of the texts. Medical and humanities experts showed a slight but nonsignificant difference in detection rates, with medical experts correctly identifying 31 out of 43 (72%) decision rounds compared with 17 out of 26 (65%) decision rounds by humanities experts (odds ratio 1.37, 95% CI 0.5-3.9). Among the 35 participants, 21 (60%) misidentified the authorship of at least one text pair, including 12 medical experts. Additionally, 5 (14%) participants, including 3 physicians, misidentified both text pairs.</p>
        <p>Notably, familiarity with the topic did not significantly impact identification accuracy (<xref ref-type="table" rid="table4">Table 4</xref>), nor did personal characteristics such as age, academic qualifications, or years of teaching experience. However, younger participants without advanced academic titles showed a slight tendency to better identify ChatGPT-generated texts. Confidence in participants’ own judgments did not differ significantly across groups (odds ratio 0.6, 95% CI 0.2-1.79).</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Characteristics of the participants with correct and incorrect decisions about the authorship of the respective text.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="170"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="0"/>
            <thead>
              <tr valign="top">
                <td rowspan="3" colspan="3">Characteristics</td>
                <td colspan="7">All participants</td>
                <td colspan="7">Medical experts</td>
                <td colspan="7">Humanities experts</td>
              </tr>
              <tr valign="top">
                <td colspan="7">Decision</td>
                <td colspan="7">Decision</td>
                <td colspan="7">Decision</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Correct</td>
                <td colspan="2">False</td>
                <td colspan="2">OR<sup>a</sup> (95% CI)</td>
                <td colspan="3">Correct</td>
                <td colspan="2">False</td>
                <td colspan="2">OR (95% CI)</td>
                <td colspan="3">Correct</td>
                <td colspan="2">False</td>
                <td colspan="2">OR (95% CI)</td>
                <td>
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Tests, n (%)</td>
                <td colspan="2">48 (70)</td>
                <td colspan="2">21 (30)</td>
                <td colspan="2">N/A<sup>b</sup></td>
                <td colspan="3">31 (72)</td>
                <td colspan="2">12 (28)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">17 (65)</td>
                <td colspan="2">9 (35)</td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Age (years), n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&lt;40</td>
                <td colspan="2">24 (73)</td>
                <td colspan="2">9 (27)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">17 (68)</td>
                <td colspan="2">8 (32)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">7 (88)</td>
                <td colspan="2">1 (12)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥40</td>
                <td colspan="2">24 (67)</td>
                <td colspan="2">12 (33)</td>
                <td colspan="2">0.75 (0.27-2.11)</td>
                <td colspan="3">14 (78)</td>
                <td colspan="2">4 (22)</td>
                <td colspan="2">1.65 (0.41-6.63)</td>
                <td colspan="3">10 (56)</td>
                <td colspan="2">8 (44)</td>
                <td colspan="2">0.18 (0.02-1.77)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>PhD/professorship, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td colspan="2">37 (67)</td>
                <td colspan="2">18 (33)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">25 (71)</td>
                <td colspan="2">10 (29)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">12 (60)</td>
                <td colspan="2">8 (40)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td colspan="2">11 (78.6)</td>
                <td colspan="2">3 (21.4)</td>
                <td colspan="2">1.78 (0.44-7.2)</td>
                <td colspan="3">6 (75)</td>
                <td colspan="2">2 (25)</td>
                <td colspan="2">1.2 (0.21-6.98)</td>
                <td colspan="3">5 (83.3)</td>
                <td colspan="2">1 (16.7)</td>
                <td colspan="2">3.33 (0.33-34.12)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Experience in academic teaching<sup>c</sup> (years), n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥5</td>
                <td colspan="2">30 (67)</td>
                <td colspan="2">15 (33)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">16 (70)</td>
                <td colspan="2">7 (30)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">14 (64)</td>
                <td colspan="2">8 (36)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&lt;5 or none</td>
                <td colspan="2">18 (75)</td>
                <td colspan="2">6 (25)</td>
                <td colspan="2">1.5 (0.49-4.56)</td>
                <td colspan="3">15 (75)</td>
                <td colspan="2">5 (25)</td>
                <td colspan="2">1.31 (0.34-5.05)</td>
                <td colspan="3">3 (75)</td>
                <td colspan="2">1 (25)</td>
                <td colspan="2">1.71 (0.15-19.36)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Authorship in a publication, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td colspan="2">44 (70)</td>
                <td colspan="2">19 (30)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">28 (72)</td>
                <td colspan="2">11 (28)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">16 (67)</td>
                <td colspan="2">8 (33)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td colspan="2">4 (67)</td>
                <td colspan="2">2 (33)</td>
                <td colspan="2">0.86 (0.15-5.12)</td>
                <td colspan="3">3 (75)</td>
                <td colspan="2">1 (25)</td>
                <td colspan="2">1.18 (0.11-12.59)</td>
                <td colspan="3">1 (50)</td>
                <td colspan="2">1 (50)</td>
                <td colspan="2">0.5 (0.03-9.08)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Experience with ChatGPT<sup>c</sup>, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Yes</td>
                <td colspan="2">20 (74)</td>
                <td colspan="2">7 (26)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">9 (82)</td>
                <td colspan="2">2 (18)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">11 (69)</td>
                <td colspan="2">5 (31)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>No</td>
                <td colspan="2">28 (67)</td>
                <td colspan="2">14 (33)</td>
                <td colspan="2">0.7 (0.24-2.05)</td>
                <td colspan="3">22 (69)</td>
                <td colspan="2">10 (31)</td>
                <td colspan="2">0.49 (0.09-2.69)</td>
                <td colspan="3">6 (60)</td>
                <td colspan="2">4 (40)</td>
                <td colspan="2">0.68 (0.13-3.55)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Text pair (sequence), n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>First</td>
                <td colspan="2">23 (66)</td>
                <td colspan="2">12 (34)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">16 (73)</td>
                <td colspan="2">6 (27)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">7 (54)</td>
                <td colspan="2">6 (46)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Second</td>
                <td colspan="2">25 (74)</td>
                <td colspan="2">9 (26)</td>
                <td colspan="2">0.75 (0.27-2.09)</td>
                <td colspan="3">15 (71)</td>
                <td colspan="2">6 (29)</td>
                <td colspan="2">0.94 (0.25-3.56)</td>
                <td colspan="3">10 (77)</td>
                <td colspan="2">3 (23)</td>
                <td colspan="2">2.86 (0.53-15.47)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Familiar with the topic, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>More</td>
                <td colspan="2">25 (68)</td>
                <td colspan="2">12 (32)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">18 (75)</td>
                <td colspan="2">6 (25)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">7 (54)</td>
                <td colspan="2">6 (46)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Less</td>
                <td colspan="2">23 (72)</td>
                <td colspan="2">9 (28)</td>
                <td colspan="2">1.01 (0.36-2.8)</td>
                <td colspan="3">13 (68)</td>
                <td colspan="2">6 (32)</td>
                <td colspan="2">0.72 (0.19-2.75)</td>
                <td colspan="3">10 (77)</td>
                <td colspan="2">3 (23)</td>
                <td colspan="2">2.86 (0.53-15.47)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Self-confidence in the decision<sup>c</sup>, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Rather sure</td>
                <td colspan="2">35 (73)</td>
                <td colspan="2">13 (27)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">22 (76)</td>
                <td colspan="2">7 (24)</td>
                <td colspan="2">N/A</td>
                <td colspan="3">13 (68)</td>
                <td colspan="2">6 (32)</td>
                <td colspan="2">N/A</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unsure</td>
                <td colspan="2">13 (62)</td>
                <td colspan="2">8 (38)</td>
                <td colspan="2">0.6 (0.2-1.79)</td>
                <td colspan="3">9 (64)</td>
                <td colspan="2">5 (36)</td>
                <td colspan="2">0.57 (0.14-2.29)</td>
                <td colspan="3">4 (57)</td>
                <td colspan="2">3 (43)</td>
                <td colspan="2">0.62 (0.1-3.66)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>OR: odds ratio for the correct decision.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>Self-assessed.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Interview Analysis</title>
        <p>When authorship was correctly identified, texts written by medical students received notably higher ratings for stylistic fluency, the internal logic of argumentation, and scientific quality (see <xref rid="figure1" ref-type="fig">Figure 1</xref>A, right-hand side). These differences were less pronounced in the assessment of knowledge limitations and future research directions. Regardless of correct identification, the way sources were cited was consistently rated higher in student-authored texts (<xref rid="figure1" ref-type="fig">Figure 1</xref>). Among humanities experts, score differences between correctly and incorrectly classified texts were minimal, though the academic quality of student-written texts was still rated significantly (<italic>r</italic>=0.336, <italic>P</italic>=.009) higher overall (<xref rid="figure1" ref-type="fig">Figure 1</xref>B, right-hand side). Many participants who misidentified the authorship attributed their errors to either underestimating the quality of student work or overestimating ChatGPT’s capabilities—particularly in terms of logical coherence, the presentation of scientific knowledge limitations, and the formulation of new research ideas.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Association of mean school grade (using German school grades 1=very good to 6=unsatisfactory) and correctness of authoring identification in (A) medical experts and (B) humanities experts. Participants were not yet unblinded at the time of assessment (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for details). Left side: incorrect attribution, right side: correct attribution of authorship. *<italic>P</italic>&lt;.05 (2-sided Wilcoxon signed rank test). C: chatbot-generated text; S: student text.</p>
          </caption>
          <graphic xlink:href="mededu_v11i1e62779_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Free-Text Analysis</title>
        <p>We categorized the 187 freely formulated reasons participants provided for their decisions into 1 of 12 derived categories (see <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). Three categories were excluded from statistical analysis due to their low frequency: inconsistency of writing style (n=4), other issues (n=4), and errors in content (n=3). Notably, all 3 content-error attributions came from the medical expert group. Of the remaining 176 statements, 88 (50%) were contributed by medical experts and 88 (50%) by humanities scholars (<xref ref-type="table" rid="table5">Table 5</xref>).</p>
        <p>The experiment revealed that significantly more statements were made about (suspected) ChatGPT-generated texts (130/176, 73.9%) than about student-written texts, regardless of whether the suspicion was correct (<xref ref-type="table" rid="table5">Table 5</xref>). Sample statements from both groups are provided in <xref ref-type="table" rid="table6">Tables 6</xref> and <xref ref-type="table" rid="table7">7</xref>. Medical experts’ explanations were often concise, frequently critiquing a “superficial” style with “unnecessary additional information.” By contrast, humanities experts tended to provide more detailed justifications, describing characteristics such as “smooth style” and “redundancies.”</p>
        <p>We analyzed the likelihood of specific categories being mentioned in reference to texts suspected to be generated by ChatGPT. The results indicate that “redundancy” (12/14, 86%, associated with GPT vs 2/14, 14%, with student texts), “repetition” (20/22, 91% vs 2/22, 9%), and “common thread and coherence” (21/24, 88% vs 3/24, 13%) were the most frequently cited characteristics (<xref rid="figure2" ref-type="fig">Figure 2</xref>).</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>The remaining 9 categories and item frequency by presumed nature of the text (for a detailed explanation in German and English, see <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="70"/>
            <col width="240"/>
            <col width="130"/>
            <col width="140"/>
            <col width="140"/>
            <col width="140"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td>Item</td>
                <td>Category</td>
                <td colspan="5">How often mentioned</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Overall, n (%)</td>
                <td colspan="2">Humanities</td>
                <td colspan="2">Medical experts</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Chatbot, n (%)</td>
                <td>Students, n (%)</td>
                <td>Chatbot, n (%)</td>
                <td>Students, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>176 (100)</td>
                <td>59 (33.5)</td>
                <td>29 (16.5)</td>
                <td>71 (40.3)</td>
                <td>17 (9.7)</td>
              </tr>
              <tr valign="top">
                <td>1</td>
                <td>Differentiated content</td>
                <td>16 (9.1)</td>
                <td>4 (6.8)</td>
                <td>4 (13.8)</td>
                <td>4 (5.6)</td>
                <td>4 (23.5)</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Superficial content</td>
                <td>13 (7.4)</td>
                <td>2 (3.4)</td>
                <td>2 (6.9)</td>
                <td>8 (11.3)</td>
                <td>1 (5.9)</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Redundancy</td>
                <td>14 (8.0)</td>
                <td>7 (11.9)</td>
                <td>2 (6.9)</td>
                <td>5 (7.0)</td>
                <td>N/A<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>Monotonous structure of sentences</td>
                <td>14 (8.0)</td>
                <td>6 (10.2)</td>
                <td>4 (13.8)</td>
                <td>4 (5.6)</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>Repetition</td>
                <td>22 (12.5)</td>
                <td>8 (13.6)</td>
                <td>1 (3.4)</td>
                <td>12 (16.9)</td>
                <td>1 (5.9)</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>Common thread coherency</td>
                <td>24 (13.6)</td>
                <td>10 (16.9)</td>
                <td>2 (6.9)</td>
                <td>11 (15.5)</td>
                <td>1 (5.9)</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>Distinctive literature style</td>
                <td>16 (9.1)</td>
                <td>3 (5.1)</td>
                <td>2 (6.9)</td>
                <td>8 (11.3)</td>
                <td>3 (17.6)</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>Form</td>
                <td>25 (14.2)</td>
                <td>6 (10.2)</td>
                <td>6 (20.7)</td>
                <td>9 (12.7)</td>
                <td>4 (23.5)</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>Distinctive Wording</td>
                <td>32 (18.2)</td>
                <td>13 (22.0)</td>
                <td>6 (20.7)</td>
                <td>10 (14.1)</td>
                <td>3 (17.6)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Excerpt from the statements of the medical expert group on the main reasons for choosing ChatGPT as the author.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>German (original statement)</td>
                <td>English (translation)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>“‚erschien zu perfekt geschrieben, oberflächlich‘”</td>
                <td>“‚seemed too perfectly written, superficial’”</td>
              </tr>
              <tr valign="top">
                <td>“‚unnützes Wissen, Zusatzinfos, die nicht notwendig für die Arbeit wären‘”</td>
                <td>“‚useless knowledge, additional information that is not necessary for the work‘”</td>
              </tr>
              <tr valign="top">
                <td>“‚fehlender roter Faden, fehlende Kontinuität der Logik’”</td>
                <td>“‚lack of common thread, lack of continuity of logic’”</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Excerpt from the statements of the humanities expert group on the main reasons for choosing ChatGPT as the author.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>German (original statement)</td>
                <td>English (translation)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>“‚fehlende Kohärenz, Redundanz, Monotonie […] ist sehr redundant, wiederholt Formulierungen teils mehrfach in Variationen. Der Definitionsteil wirkt reihend, stilistisch homogen, […] teils erfährt man, was man sich hätte denken können, […]. Der letzte Absatz wiederholt in etwa, was vorher da stand - was so wirkt, als hätte er diesen schon 'vergessen'.”</td>
                <td>“‚lack of coherence, redundancy, monotony [...] is very redundant, repeats formulations sometimes several times in variations. The definition section appears to be sequential, stylistically homogeneous, [...] partly one learns what one could have imagined, [...]. The last paragraph roughly repeats what was there before - which makes it seem as if he had already 'forgotten' it.”</td>
              </tr>
              <tr valign="top">
                <td>“‚Smooth, fließende Übergänge, aber übertextlich schlechter, d.h. gesamt Kohärenz schlechter (Wiederholung), habe nichts gelernt‘.”</td>
                <td>“‚Smooth, fluent transitions, but overtextually worse, i.e. overall coherence worse (repetition), 'haven't learned anything'.”</td>
              </tr>
              <tr valign="top">
                <td>“‚Wiederholung vieler Sätze und Inhalte; ausgeprägte Tendenz zu bestimmten schablonenartigen Formulierungen im Sinne einer ‘Anmoderation’, z.T. phrasenhaft ohne Inhalt. Optisch gute Gliederung (vorgegeben durch die Überschriften), jedoch roter Faden nicht gut erkennbar, vieles wirkt lediglich wie aufgelistete Einzelformationen. […] Nennung vieler Quellen, deren Zuordnung zu einzelnen Aussagen ist oft nicht konkret.”</td>
                <td>“‚Repetition of many sentences and contents; pronounced tendency towards certain template-like formulations in the sense of a ‘presentation’, sometimes phrase-like without content. Visually well structured (given by the headings), but a common thread is not easily recognizable, many things appear to be merely a list of individual formations. [...] Mention of many sources, their assignment to individual statements is often not concrete.”</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Estimated probability of thinking of ChatGPT as authorship.</p>
          </caption>
          <graphic xlink:href="mededu_v11i1e62779_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Overview</title>
        <p>This analysis offers insights into the current identification rate of AI-generated texts and their evaluation compared with medical student texts by 2 different expert groups. It also provides an initial overview of the decision-making processes of medical and humanities experts during these assessments. Our findings suggest that both medical and humanities experts can effectively identify ChatGPT-generated texts in medical contexts and that linguistic and stylistic features play a significant role in distinguishing AI-generated from human-written texts, regardless of content familiarity. This supports the broader notion that linguistic analysis is crucial in identifying AI-generated text, aligning with foundational theories in human-robot interaction, such as Turing’s predictions [<xref ref-type="bibr" rid="ref32">32</xref>].</p>
      </sec>
      <sec>
        <title>Identification Rate</title>
        <p>In the 1950s, Alan Turing [<xref ref-type="bibr" rid="ref32">32</xref>] predicted that within 50 years, AI would advance to the point where the likelihood of identifying a machine as nonhuman in a dialogue or an “imitation game” would be no more than 70% [<xref ref-type="bibr" rid="ref32">32</xref>]. With a slight delay of about 20 years, his prediction was almost precisely fulfilled in an online game inspired by the Turing Test [<xref ref-type="bibr" rid="ref5">5</xref>]. Unlike Turing’s method and the large-scale Israeli study, our research did not involve direct dialogue between humans and machines [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. However, when participants were presented with 2 texts of different authorship, an internal dialogue was essential for making an authorship determination. Ultimately, our study’s main finding aligns almost exactly with Turing’s prediction: only in 48 out of 69 (70%) decision rounds, participants correctly identified the ChatGPT-generated text. This accuracy rate remained consistent regardless of whether participants were experts in the content of the text or in linguistic analysis, and irrespective of their prior experience with ChatGPT. Notably, familiarity with the subject matter did not appear to be a decisive factor, as humanities experts performed similarly to medical experts who specialized in the respective topics. Moreover, at the individual participant level, no significant differences were found between the 2 expert groups in terms of their proximity to the text’s subject matter.</p>
        <p>A Chinese study by Ma et al [<xref ref-type="bibr" rid="ref2">2</xref>], which also examined the identification rate of chatbot-generated texts, reported similar findings, with approximately 66% of texts correctly identified. This study analyzed around 40 scientific texts, including 20 scientific paper abstracts and 20 wiki item descriptions, assessed by 2 PhD students with a background in computer science [<xref ref-type="bibr" rid="ref2">2</xref>]. Ma et al [<xref ref-type="bibr" rid="ref2">2</xref>] also highlighted notable differences in writing style between AI-generated and human-written scientific texts, a conclusion that aligns with our findings. In our study, participants primarily based their decisions on text-analytical features, while content errors influenced their judgment in only 3 instances.</p>
        <p>The study by Waltzer et al [<xref ref-type="bibr" rid="ref36">36</xref>], which closely resembles our research in design, reported similar findings. In their study, 140 college instructors were presented with pairs of essays and correctly identified the ChatGPT-generated text 70% of the time. Like our results, Waltzer et al [<xref ref-type="bibr" rid="ref36">36</xref>] found that neither prior experience with ChatGPT nor subject-specific expertise—measured by self-reported familiarity with the topic—significantly improved identification accuracy [<xref ref-type="bibr" rid="ref36">36</xref>]. However, a key difference is that their study analyzed English-language essays written for a psychology program, whereas our research focused on German-language texts authored by medical students [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      </sec>
      <sec>
        <title>Performance</title>
        <p>The evaluation of a text can focus on different levels and aspects, often emphasizing either content or linguistic features. Currently, AI programs such as ChatGPT are recognized for their seemingly perfected linguistic style [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. A notable case at a German university (TU Munich) illustrates this: an essay submitted as part of a Master’s application was rejected—and this decision was upheld by a court—on the grounds that it was “too well written,” strongly suggesting AI authorship [<xref ref-type="bibr" rid="ref13">13</xref>]. However, it is important to note that this essay was written in English [<xref ref-type="bibr" rid="ref13">13</xref>]. While ChatGPT is also proficient in translating languages such as German and Chinese [<xref ref-type="bibr" rid="ref15">15</xref>], its performance in German differs from English. Research suggests that AI-generated texts tend to be more nuanced and varied in English than in German [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. This discrepancy is likely due to the greater availability of digital data in English, which results in more refined and contextually accurate outputs. Nevertheless, AI language models continuously improve as they interact with users, enhancing their capabilities in non–English languages over time.</p>
        <p>Interestingly, the humanities group, despite their focus on linguistic features, identified ChatGPT-generated texts less accurately than the medical expert group—though this difference was not statistically significant. Notably, humanities experts rated the linguistic quality of ChatGPT texts higher than those written by medical students, a contrast that was significant compared with the evaluations of the medical experts. The decision-making process behind text identification revealed key patterns: participants were more likely to suspect a human author when encountering spelling and grammatical errors, greater variation in sentence structure, medical-specific terminology, a writing style aimed at a professional readership, or shifts in citation style.</p>
        <p>An “AI author,” by contrast, was suspected if there was a monotonous sentence structure, partly “English” grammar, a “smooth” wording style, that is, good readability/understandability, but overall more superficial, an intended less professional readership, better overall formal structure of the text (derivation, outline, weft), frequent repetitions, and a lack of supra-textual coherence of the argumentation in contrast to the coherent and easily comprehensible sequence of arguments within individual paragraphs.</p>
        <p>Many studies explored the identifiability of chatbot-generated text using machine learning–based detectors, a subset of AI technologies [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]. These detectors often achieve higher identification rates than human evaluators. However, direct human comparison is rarely included, and accuracy and <italic>F</italic><sub>1</sub>-scores vary significantly depending on the text genre and the specific machine learning classifier used. For instance, when various LLM-based classifiers are applied to different data sets, their accuracy ranges from 70% (DetectGPT classifier on Wikipedia articles) to 97% (GPT-Pat classifier on COVID-19–related question-answer data sets). Similarly, perplexity-based classifiers achieve around 70% accuracy on ACL paper abstracts, whereas RoBERTa (Robustly Optimized BERT Pretraining Approach)–based classifiers reach up to 97% on COVID-19–related data sets [<xref ref-type="bibr" rid="ref37">37</xref>].</p>
        <p>Another challenge is that while these tools are generally reliable in detecting AI-generated text, they are not always sufficiently accurate in identifying human-authored text. This suggests that the tools may struggle with the complexity of human writing while also highlighting a key limitation—especially in cases where a lecturer, for example, must evaluate a single piece of writing without comparison [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>Our study also compares the performance of medical students and ChatGPT. Notably, the texts written by medical students received higher professional evaluations. However, the humanities experts specifically rated the linguistic quality of ChatGPT-generated texts more favorably. Additionally, when comparing ChatGPT’s performance with that of medical students in an examination setting—such as in the study by Huh [<xref ref-type="bibr" rid="ref38">38</xref>]—ChatGPT performed worse than medical students [<xref ref-type="bibr" rid="ref31">31</xref>]. In a parasitology examination, ChatGPT correctly answered 60.8% of the questions, whereas the average score among 77 medical students was significantly higher at 90.8% [<xref ref-type="bibr" rid="ref38">38</xref>]. In comparison, a German study by Friederichs et al [<xref ref-type="bibr" rid="ref39">39</xref>] found that ChatGPT correctly answered two-thirds of all multiple-choice questions at the level of the German state licensing examination in the Progress Test Medicine. It even outperformed most medical students in their first 3 years and performed comparably to students in the later stages of their studies [<xref ref-type="bibr" rid="ref39">39</xref>]. Our study also revealed that participants who overestimated ChatGPT’s writing capabilities and underestimated those of the students were more likely to misidentify the author. This misconception was particularly evident in cases where participants misclassified texts in both sessions, suggesting that their biased perception significantly influenced their decisions.</p>
      </sec>
      <sec>
        <title>Interpretation</title>
        <p>Our study demonstrates that the identification rate predicted by Turing holds within a group primarily engaged in student teaching and academic writing. Our findings confirm the expectation that linguistic features play a more significant role in identifying AI-generated texts than content familiarity or specialized expertise. In both expert groups, text-analytical features were the primary factors influencing their decisions. This aligns with the emerging field of stylometric analysis, which is increasingly being applied to the detection of AI-generated content [<xref ref-type="bibr" rid="ref40">40</xref>]. ChatGPT-generated text, especially in comparison to authors from the (fictional) literature domain, exhibits limited stylistic variety [<xref ref-type="bibr" rid="ref41">41</xref>]. Notably, there was no significant difference in the identification rate between the 2 expert groups, despite 1 being more familiar with the subject matter. Higher proximity to the topic was also not a predictive factor at the individual participant level. Instead, certain linguistic characteristics played a key role in the decision-making process and were consistently associated with AI-generated texts. In particular, redundancy, repetition, and a lack of coherence were distinctive features attributed to ChatGPT-generated texts. While these traits influenced the perception of AI authorship, they ultimately did not prove to be reliable predictors for correct identification. The linguistic features of ChatGPT-generated texts are often perceived as superior due to their smoother wording and better structural organization. This aligns with findings from [<xref ref-type="bibr" rid="ref42">42</xref>], which indicate that AI-generated texts tend to exhibit relatively low lexical density, high reading ease, and frequent use of the simple present tense. Whether these linguistic characteristics, if systematically outlined in a manual and provided to participants beforehand, could enhance identification accuracy remains an open question. However, this presents an intriguing avenue for future research.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>While numerous studies are currently investigating the performance of LLM-based text generators such as ChatGPT, many focus primarily on their assistive role in the writing process rather than assessing the quality of fully generated long-form scientific texts. A key contribution of our study is that it examines complete, AI-generated scientific texts rather than partial outputs. Additionally, instead of relying on specialized AI detection tools, we analyze how individuals working in academia recognize such texts without assistance and how they evaluate their performance while identifying distinct linguistic features. This study enables the compilation of categorical features that could aid in identifying AI-generated text in both academic and everyday reading. However, limitations in generalizability arise due to the relatively small sample size and the exclusive use of a single AI model, ChatGPT version 3.5. Nevertheless, for an exploratory study, we do not consider this a critical issue. Additionally, participants were aware that 1 of the texts had to be AI-generated, raising the question of whether they would have identified an AI-authored text without this prior knowledge. A further limitation arises from the use of different interviewers for the 2 expert groups, who also differed methodologically in terms of blinding. However, it should be noted that the decision to identify the authors was always made before the interview process. Additionally, the interview was transcribed in bullet points, so some information may have been lost in this process. Finally, the dynamic nature of development should also be acknowledged, as ChatGPT, like other AI programs, is continuously being developed and improved.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>Our study shows that linguistic and text-analytical features, in particular, play a role in the decision-making process for correctly identifying a chatbot author. In our sample, both nonspecialists and specialists identified AI-generated texts with an accuracy rate of approximately 70% (48/69). Further quasi-experimental studies using texts from other academic disciplines should be conducted to determine whether instructions based on these features can enhance lecturers’ ability to distinguish between student-authored and AI-generated work.</p>
        <p>A follow-up study could be conducted in a few years to track the evolution of AI-generated text identification and examine whether identification success changes as AI technology and tools advance.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Questionnaire with English translation and abbreviation label.</p>
        <media xlink:href="mededu_v11i1e62779_app1.docx" xlink:title="DOCX File , 15 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Categories for the qualitative analysis, created from the various reasons given in free form for the decision on the authorship of a text.</p>
        <media xlink:href="mededu_v11i1e62779_app2.docx" xlink:title="DOCX File , 18 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">RoBERTa</term>
          <def>
            <p>Robustly Optimized BERT Pretraining Approach</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">RUB</term>
          <def>
            <p>Ruhr University Bochum</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors thank the students for providing their work. We also extend our gratitude to our colleagues at the Paediatric and Neurological University Clinics of the Ruhr-University of Bochum, as well as the teachers at the Department of Philology, for their voluntary participation, contributions, and suggestions. Additionally, we thank the Medical Dean of Studies, Prof. T. Schäfer, for the initial exchange, and Dr. A. Lucke for her critical endorsement of our work.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>BD and JSB contributed equally to conceptualization and data acquisition, with BD leading the qualitative analysis and the original draft writing. CM played a leading role in conceptualization, supervision, and writing—review and editing—while contributing equally to formal analysis and data acquisition. TL and MB shared equal responsibilities in supervision and writing—review and editing. JS contributed equally to conceptualization, qualitative analysis, and writing, whereas EEK was involved in writing—review and editing on an equal basis. SH took the lead in proofreading and contributed equally to review and editing. MT led the formal analysis while sharing equal responsibilities in supervision and writing—review and editing. All authors have reviewed and approved the final manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jannai</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Meron</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lenz</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Levine</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shoham</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Human or not? A gamified approach to the Turing Test</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on January 30, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.2305.20010"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>AI vs. human -- differentiation analysis of scientific content generation</article-title>
          <source>arXiv</source>
          <access-date>2023-05-01</access-date>
          <comment>Preprint posted online on January 21, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.2301.10416">https://doi.org/10.48550/arXiv.2301.10416</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>von Garrel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mühlfeld</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Hochschule Darmstadt</source>
          <year>2023</year>
          <access-date>2024-11-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48444/h_docs-pub-395">https://doi.org/10.48444/h_docs-pub-395</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <article-title>ChatGPT: optimizing language models for dialogue</article-title>
          <source>OpenAI</source>
          <access-date>2023-07-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://openai.com/blog/chatgpt/">https://openai.com/blog/chatgpt/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Taecharungroj</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>“What can ChatGPT do?” Analyzing early reactions to the innovative AI chatbot on Twitter</article-title>
          <source>BDCC</source>
          <year>2023</year>
          <month>02</month>
          <day>16</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>35</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3390/bdcc7010035"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/bdcc7010035</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berdejo-Espinola</surname>
              <given-names>Violeta</given-names>
            </name>
            <name name-style="western">
              <surname>Amano</surname>
              <given-names>Tatsuya</given-names>
            </name>
          </person-group>
          <article-title>AI tools can improve equity in science</article-title>
          <source>Science</source>
          <year>2023</year>
          <month>03</month>
          <day>10</day>
          <volume>379</volume>
          <issue>6636</issue>
          <fpage>991</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1126/science.adg9714"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/science.adg9714</pub-id>
          <pub-id pub-id-type="medline">36893248</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marx</surname>
              <given-names>JPS</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT im studium: die top 10 befehle für effektives Lernen</article-title>
          <source>Shribe</source>
          <year>2023</year>
          <access-date>2024-11-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://shribe.de/chatgpt-studium/">https://shribe.de/chatgpt-studium/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arif</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Munaf</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Ul-Haque</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>The future of medical education and research: is ChatGPT a blessing or blight in disguise?</article-title>
          <source>Med Educ Online</source>
          <year>2023</year>
          <month>12</month>
          <day>21</day>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>2181052</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.tandfonline.com/doi/abs/10.1080/10872981.2023.2181052?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/10872981.2023.2181052</pub-id>
          <pub-id pub-id-type="medline">36809073</pub-id>
          <pub-id pub-id-type="pmcid">PMC9946299</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>Edmond Pui Hang</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Jung Jae</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>Mu-Hsing</given-names>
            </name>
            <name name-style="western">
              <surname>Kwok</surname>
              <given-names>Jojo Yan Yan</given-names>
            </name>
            <name name-style="western">
              <surname>Lok</surname>
              <given-names>Kris Yuet Wan</given-names>
            </name>
          </person-group>
          <article-title>Chatting or cheating? The impacts of ChatGPT and other artificial intelligence language models on nurse education</article-title>
          <source>Nurse Educ Today</source>
          <year>2023</year>
          <month>06</month>
          <volume>125</volume>
          <fpage>105796</fpage>
          <pub-id pub-id-type="doi">10.1016/j.nedt.2023.105796</pub-id>
          <pub-id pub-id-type="medline">36934624</pub-id>
          <pub-id pub-id-type="pii">S0260-6917(23)00090-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Flanagin</surname>
              <given-names>Annette</given-names>
            </name>
            <name name-style="western">
              <surname>Bibbins-Domingo</surname>
              <given-names>Kirsten</given-names>
            </name>
            <name name-style="western">
              <surname>Berkwits</surname>
              <given-names>Michael</given-names>
            </name>
            <name name-style="western">
              <surname>Christiansen</surname>
              <given-names>Stacy L</given-names>
            </name>
          </person-group>
          <article-title>Nonhuman "authors" and implications for the integrity of scientific publication and medical knowledge</article-title>
          <source>JAMA</source>
          <year>2023</year>
          <month>02</month>
          <day>28</day>
          <volume>329</volume>
          <issue>8</issue>
          <fpage>637</fpage>
          <lpage>639</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1001/jama.2023.1344"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2023.1344</pub-id>
          <pub-id pub-id-type="medline">36719674</pub-id>
          <pub-id pub-id-type="pii">2801170</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>Yiqiu</given-names>
            </name>
            <name name-style="western">
              <surname>Heacock</surname>
              <given-names>Laura</given-names>
            </name>
            <name name-style="western">
              <surname>Elias</surname>
              <given-names>Jonathan</given-names>
            </name>
            <name name-style="western">
              <surname>Hentel</surname>
              <given-names>Keith D</given-names>
            </name>
            <name name-style="western">
              <surname>Reig</surname>
              <given-names>Beatriu</given-names>
            </name>
            <name name-style="western">
              <surname>Shih</surname>
              <given-names>George</given-names>
            </name>
            <name name-style="western">
              <surname>Moy</surname>
              <given-names>Linda</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT and other large language models are double-edged swords</article-title>
          <source>Radiology</source>
          <year>2023</year>
          <month>04</month>
          <volume>307</volume>
          <issue>2</issue>
          <fpage>e230163</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1148/radiol.230163"/>
          </comment>
          <pub-id pub-id-type="doi">10.1148/radiol.230163</pub-id>
          <pub-id pub-id-type="medline">36700838</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>Siobhan</given-names>
            </name>
          </person-group>
          <article-title>Open artificial intelligence platforms in nursing education: tools for academic progress or abuse?</article-title>
          <source>Nurse Educ Pract</source>
          <year>2023</year>
          <month>01</month>
          <volume>66</volume>
          <fpage>103537</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.nepr.2022.103537"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.nepr.2022.103537</pub-id>
          <pub-id pub-id-type="medline">36549229</pub-id>
          <pub-id pub-id-type="pii">S1471-5953(22)00251-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zenthöfer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Erstes urteil zu ChatGPT an hochschulen</article-title>
          <source>FAZ</source>
          <year>2024</year>
          <access-date>2024-05-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.faz.net/aktuell/karriere-hochschule/student-nutzt-chatgpt-fuer-bewerbung-erstes-urteil-zu-ki-an-hochschulen-19564795.html">https://www.faz.net/aktuell/karriere-hochschule/student-nutzt-chatgpt-fuer-bewerbung-erstes-urteil-zu-ki-an-hochschulen-19564795.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abburi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Suesserman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pudota</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Veeramani</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bowen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bhattacharya</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A simple yet efficient ensemble approach for AI-generated text detection</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on January 23, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.2311.03084"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jiao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Is ChatGPT a good translator? A preliminary  study</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on January 14, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.2301.08745"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Richtscheid</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Some hints for the use of “chatGPT” when using with German input language</article-title>
          <source>Medium</source>
          <year>2023</year>
          <access-date>2023-07-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medium.com/@walter.richtscheid_93860/notes-on-the-use-of-chatgpt-in-german-language-c4941a14da54">https://medium.com/@walter.richtscheid_93860/notes-on-the-use-of-chatgpt-in-german-language-c4941a14da54</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>De Vries</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Lucke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alexa</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Computergenerierter Zufall als kreatives Moment in Malerei und Literatur.  Potentiale und Grenzen von Machine-Learning-Modellen am Beispiel von GPT</article-title>
          <source>Literaturwissenschaft und Informatik. Transdisziplinäre Perspektiven, digitale Methoden und selbstlernende Algorithmen</source>
          <year>2024</year>
          <publisher-loc>Bielefeld, Germany</publisher-loc>
          <publisher-name>Universität Bielefeld</publisher-name>
          <fpage>93</fpage>
          <lpage>121</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Corizzo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Leal-Arenas</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>One-GPT: a one-class deep fusion model for machine-generated text detection</article-title>
          <year>2023</year>
          <conf-name>IEEE International Conference on Big Data (BigData)</conf-name>
          <conf-date>December 15-18, 2023</conf-date>
          <conf-loc>Sorrento, Italy</conf-loc>
          <fpage>5743</fpage>
          <lpage>5752</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Parviainen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rantala</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Chatbot breakthrough in the 2020s? An ethical reflection on the trend of automated consultations in health care</article-title>
          <source>Med Health Care Philos</source>
          <year>2022</year>
          <month>03</month>
          <day>04</day>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>61</fpage>
          <lpage>71</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34480711"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11019-021-10049-w</pub-id>
          <pub-id pub-id-type="medline">34480711</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11019-021-10049-w</pub-id>
          <pub-id pub-id-type="pmcid">PMC8416570</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alturaiki</surname>
              <given-names>Alma Mohammed</given-names>
            </name>
            <name name-style="western">
              <surname>Banjar</surname>
              <given-names>Haneen Reda</given-names>
            </name>
            <name name-style="western">
              <surname>Barefah</surname>
              <given-names>Ahmed Salleh</given-names>
            </name>
            <name name-style="western">
              <surname>Alnajjar</surname>
              <given-names>Salwa Abdulrahman</given-names>
            </name>
            <name name-style="western">
              <surname>Hindawi</surname>
              <given-names>Salwa</given-names>
            </name>
          </person-group>
          <article-title>A smart chatbot for interactive management in beta thalassemia patients</article-title>
          <source>Int J Telemed Appl</source>
          <year>2022</year>
          <volume>2022</volume>
          <fpage>9734518</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1155/2022/9734518"/>
          </comment>
          <pub-id pub-id-type="doi">10.1155/2022/9734518</pub-id>
          <pub-id pub-id-type="medline">35601050</pub-id>
          <pub-id pub-id-type="pmcid">PMC9117039</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bin Sawad</surname>
              <given-names>Abdullah</given-names>
            </name>
            <name name-style="western">
              <surname>Narayan</surname>
              <given-names>Bhuva</given-names>
            </name>
            <name name-style="western">
              <surname>Alnefaie</surname>
              <given-names>Ahlam</given-names>
            </name>
            <name name-style="western">
              <surname>Maqbool</surname>
              <given-names>Ashwaq</given-names>
            </name>
            <name name-style="western">
              <surname>Mckie</surname>
              <given-names>Indra</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>Jemma</given-names>
            </name>
            <name name-style="western">
              <surname>Yuksel</surname>
              <given-names>Berkan</given-names>
            </name>
            <name name-style="western">
              <surname>Puthal</surname>
              <given-names>Deepak</given-names>
            </name>
            <name name-style="western">
              <surname>Prasad</surname>
              <given-names>Mukesh</given-names>
            </name>
            <name name-style="western">
              <surname>Kocaballi</surname>
              <given-names>A Baki</given-names>
            </name>
          </person-group>
          <article-title>A systematic review on healthcare artificial intelligent conversational agents for chronic conditions</article-title>
          <source>Sensors (Basel)</source>
          <year>2022</year>
          <month>03</month>
          <day>29</day>
          <volume>22</volume>
          <issue>7</issue>
          <fpage>1</fpage>
          <lpage>20</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=s22072625"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/s22072625</pub-id>
          <pub-id pub-id-type="medline">35408238</pub-id>
          <pub-id pub-id-type="pii">s22072625</pub-id>
          <pub-id pub-id-type="pmcid">PMC9003264</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence-assisted psychosis risk screening in adolescents: practices and challenges</article-title>
          <source>World J Psychiatry</source>
          <year>2022</year>
          <month>10</month>
          <day>19</day>
          <volume>12</volume>
          <issue>10</issue>
          <fpage>1287</fpage>
          <lpage>1297</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.wjgnet.com/2220-3206/full/v12/i10/1287.htm"/>
          </comment>
          <pub-id pub-id-type="doi">10.5498/wjp.v12.i10.1287</pub-id>
          <pub-id pub-id-type="medline">36389087</pub-id>
          <pub-id pub-id-type="pmcid">PMC9641379</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gaffney</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Mansell</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tai</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Conversational agents in the treatment of mental health problems: mixed-method systematic review</article-title>
          <source>JMIR Ment Health</source>
          <year>2019</year>
          <month>10</month>
          <day>18</day>
          <volume>6</volume>
          <issue>10</issue>
          <fpage>e14166</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2019/10/e14166/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/14166</pub-id>
          <pub-id pub-id-type="medline">31628789</pub-id>
          <pub-id pub-id-type="pii">v6i10e14166</pub-id>
          <pub-id pub-id-type="pmcid">PMC6914342</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schick</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Feine</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Morana</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Maedche</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Reininghaus</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>Validity of chatbot use for mental health assessment: experimental study</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2022</year>
          <month>10</month>
          <day>31</day>
          <volume>10</volume>
          <issue>10</issue>
          <fpage>e28082</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2022/10/e28082/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/28082</pub-id>
          <pub-id pub-id-type="medline">36315228</pub-id>
          <pub-id pub-id-type="pii">v10i10e28082</pub-id>
          <pub-id pub-id-type="pmcid">PMC9664331</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Differentiating ChatGPT-generated and human-written medical texts: quantitative study</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <month>12</month>
          <day>28</day>
          <volume>9</volume>
          <fpage>e48904</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023//e48904/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48904</pub-id>
          <pub-id pub-id-type="medline">38153785</pub-id>
          <pub-id pub-id-type="pii">v9i1e48904</pub-id>
          <pub-id pub-id-type="pmcid">PMC10784984</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khairatun Hisan</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Miftahul Amri</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT and medical education: a double-edged sword</article-title>
          <source>Journal of Pedagogy and Education Science</source>
          <year>2023</year>
          <month>03</month>
          <day>11</day>
          <volume>2</volume>
          <issue>01</issue>
          <fpage>71</fpage>
          <lpage>89</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.56741/jpes.v2i01.302"/>
          </comment>
          <pub-id pub-id-type="doi">10.56741/jpes.v2i01.302</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hayawi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shahriar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mathew</surname>
              <given-names>Ss</given-names>
            </name>
          </person-group>
          <article-title>The imitation game: detecting human and AI-generated texts in the era of ChatGPT and BARD</article-title>
          <source>Journal of Information Science</source>
          <year>2024</year>
          <month>02</month>
          <day>14</day>
          <volume>The Imitation Game</volume>
          <fpage>1</fpage>
          <lpage>36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.2307.12166"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/01655515241227531</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Orenstrakh</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Karnalim</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Suarez</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Liut</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Detecting LLM-generated text in computing education: a comparative study for ChatGPT cases</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on January 17, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.2307.07411"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/compsac61105.2024.00027</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mitrovic</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Andreoletti</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ayoub</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT or human? Detect and explain. Explaining decisions of machine learning model for detecting short ChatGPT-generated text</article-title>
          <source>arXiv</source>
          <access-date>2023-05-01</access-date>
          <comment>Preprint posted online on January 11, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.2301.13852">https://doi.org/10.48550/arXiv.2301.13852</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fröhling</surname>
              <given-names>Leon</given-names>
            </name>
            <name name-style="western">
              <surname>Zubiaga</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Feature-based detection of automated language models: tackling GPT-2, GPT-3 and Grover</article-title>
          <source>PeerJ Comput Sci</source>
          <year>2021</year>
          <volume>7</volume>
          <fpage>e443</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33954234"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj-cs.443</pub-id>
          <pub-id pub-id-type="medline">33954234</pub-id>
          <pub-id pub-id-type="pii">cs-443</pub-id>
          <pub-id pub-id-type="pmcid">PMC8049133</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elkhatat</surname>
              <given-names>Am</given-names>
            </name>
            <name name-style="western">
              <surname>Elsaid</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Almeer</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the efficacy of AI content detection tools in differentiating between human and AI-generated text</article-title>
          <source>Int J Educ Integr</source>
          <year>2023</year>
          <month>09</month>
          <day>01</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>17</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1007/s40979-023-00140-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40979-023-00140-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Turing</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Computing machinery and intelligence</article-title>
          <source>Mind</source>
          <year>1950</year>
          <month>10</month>
          <day>01</day>
          <volume>LIX</volume>
          <issue>236</issue>
          <fpage>433</fpage>
          <lpage>460</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1093/mind/LIX.236.433"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/mind/lix.236.433</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schäer</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>Einführung in Die Grammatische Beschreibung des Deutschen: Dritte</source>
          <year>2018</year>
          <publisher-loc>Berlin, Germany</publisher-loc>
          <publisher-name>Language Science Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fobbe</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <source>Forensische Linguistik: Eine Einführung</source>
          <year>2011</year>
          <publisher-loc>Tübingen, Germany</publisher-loc>
          <publisher-name>Narr Francke Attempto Verlag</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hessler</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>Autorschaftserkennung und Verstellungsstrategien: Textanalysen und-vergleiche im Spektrum forensischer Linguistik, Informationssicherheit und Machine-Learning (Volume 585)</source>
          <year>2023</year>
          <publisher-loc>Tübingen, Germany</publisher-loc>
          <publisher-name>Narr Francke Attempto Verlag</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Waltzer</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pilegard</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Heyman</surname>
              <given-names>GD</given-names>
            </name>
          </person-group>
          <article-title>Can you spot the bot? Identifying AI-generated writing in college essays</article-title>
          <source>Int J Educ Integr</source>
          <year>2024</year>
          <month>07</month>
          <day>08</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>11</fpage>
          <pub-id pub-id-type="doi">10.1007/s40979-024-00158-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>LLM paternity test: generated text detection with LLM genetic inheritance</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on January 30, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.2305.12519"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huh</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Are ChatGPT's knowledge and interpretation ability comparable to those of medical students in Korea for taking a parasitology examination?: a descriptive study</article-title>
          <source>J Educ Eval Health Prof</source>
          <year>2023</year>
          <month>01</month>
          <day>11</day>
          <volume>20</volume>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3352/jeehp.2023.20.1"/>
          </comment>
          <pub-id pub-id-type="doi">10.3352/jeehp.2023.20.01</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Friederichs</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Friederichs</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>März</surname>
              <given-names>Maren</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT in medical school: how successful is AI in progress testing?</article-title>
          <source>Med Educ Online</source>
          <year>2023</year>
          <month>12</month>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>2220920</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.tandfonline.com/doi/abs/10.1080/10872981.2023.2220920?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/10872981.2023.2220920</pub-id>
          <pub-id pub-id-type="medline">37307503</pub-id>
          <pub-id pub-id-type="pmcid">PMC10262795</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Uzun</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT and academic integrity concerns: detecting artificial intelligence generated content</article-title>
          <source>Language Education &amp; Technology</source>
          <year>2023</year>
          <access-date>2024-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.langedutech.com/letjournal/index.php/let/article/view/49/36">https://www.langedutech.com/letjournal/index.php/let/article/view/49/36</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zwilling</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Berger</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT does not speak style!</article-title>
          <year>2024</year>
          <conf-name>Computational Linguistics Poster Session at the 46th Annual Meeting of the German Linguistic Society (DGfS)</conf-name>
          <conf-date>February 28, 2024</conf-date>
          <conf-loc>Bochum, Germany</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>AlAfnan</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Mohdzuki</surname>
              <given-names>SF</given-names>
            </name>
          </person-group>
          <article-title>Do artificial intelligence chatbots have a writing style? An investigation into the stylistic features of ChatGPT-4</article-title>
          <source>Journal of Artificial Intelligence and Technology</source>
          <year>2023</year>
          <month>05</month>
          <day>12</day>
          <volume>3</volume>
          <fpage>3</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchgate.net/publication/370715677_Do_Artificial_Intelligence_Chatbots_Have_a_Writing_Style_An_Investigation_into_the_Stylistic_Features_of_ChatGPT-4"/>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
