<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Educ</journal-id><journal-id journal-id-type="publisher-id">mededu</journal-id><journal-id journal-id-type="index">20</journal-id><journal-title>JMIR Medical Education</journal-title><abbrev-journal-title>JMIR Med Educ</abbrev-journal-title><issn pub-type="epub">2369-3762</issn></journal-meta><article-meta><article-id pub-id-type="publisher-id">52674</article-id><article-id pub-id-type="doi">10.2196/52674</article-id><title-group><article-title>Importance of Patient History in Artificial Intelligence&#x2013;Assisted Medical Diagnosis: Comparison Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Fukuzawa</surname><given-names>Fumitoshi</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yanagita</surname><given-names>Yasutaka</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yokokawa</surname><given-names>Daiki</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Uchida</surname><given-names>Shun</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yamashita</surname><given-names>Shiho</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Li</surname><given-names>Yu</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Shikino</surname><given-names>Kiyoshi</given-names></name><degrees>MD, MHPE, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Tsukamoto</surname><given-names>Tomoko</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Noda</surname><given-names>Kazutaka</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Uehara</surname><given-names>Takanori</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ikusaka</surname><given-names>Masatomi</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Department of General Medicine, Chiba University Hospital</institution>, <addr-line>Chiba-shi</addr-line>, <country>Japan</country></aff><aff id="aff2"><institution>Uchida Internal Medicine Clinic</institution>, <addr-line>Saitama-shi</addr-line>, <country>Japan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Chartash</surname><given-names>David</given-names></name></contrib><contrib contrib-type="editor"><name name-style="western"><surname>Eysenbach</surname><given-names>Gunther</given-names></name></contrib><contrib contrib-type="editor"><name name-style="western"><surname>Cardoso</surname><given-names>Taiane de Azevedo</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Baxter</surname><given-names>Clarence</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Sun</surname><given-names>Hao</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Fumitoshi Fukuzawa, MD<email>f.fukuzawa0919@ymail.ne.jp</email></corresp></author-notes><pub-date pub-type="collection"><year>2024</year></pub-date><pub-date pub-type="epub"><day>8</day><month>4</month><year>2024</year></pub-date><volume>10</volume><elocation-id>e52674</elocation-id><history><date date-type="received"><day>12</day><month>09</month><year>2023</year></date><date date-type="rev-recd"><day>31</day><month>01</month><year>2024</year></date><date date-type="accepted"><day>15</day><month>02</month><year>2024</year></date></history><copyright-statement>&#x00A9; Fumitoshi Fukuzawa, Yasutaka Yanagita, Daiki Yokokawa, Shun Uchida, Shiho Yamashita, Yu Li, Kiyoshi Shikino, Tomoko Tsukamoto, Kazutaka Noda, Takanori Uehara, Masatomi Ikusaka. Originally published in JMIR Medical Education (<ext-link ext-link-type="uri" xlink:href="https://mededu.jmir.org">https://mededu.jmir.org</ext-link>), 8.4.2024. </copyright-statement><copyright-year>2024</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Education, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://mededu.jmir.org/">https://mededu.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e52674"/><abstract><sec><title>Background</title><p>Medical history contributes approximately 80% to a diagnosis, although physical examinations and laboratory investigations increase a physician&#x2019;s confidence in the medical diagnosis. The concept of artificial intelligence (AI) was first proposed more than 70 years ago. Recently, its role in various fields of medicine has grown remarkably. However, no studies have evaluated the importance of patient history in AI-assisted medical diagnosis.</p></sec><sec><title>Objective</title><p>This study explored the contribution of patient history to AI-assisted medical diagnoses and assessed the accuracy of ChatGPT in reaching a clinical diagnosis based on the medical history provided.</p></sec><sec sec-type="methods"><title>Methods</title><p>Using clinical vignettes of 30 cases identified in <italic>The BMJ</italic>, we evaluated the accuracy of diagnoses generated by ChatGPT. We compared the diagnoses made by ChatGPT based solely on medical history with the correct diagnoses. We also compared the diagnoses made by ChatGPT after incorporating additional physical examination findings and laboratory data alongside history with the correct diagnoses.</p></sec><sec sec-type="results"><title>Results</title><p>ChatGPT accurately diagnosed 76.6% (23/30) of the cases with only the medical history, consistent with previous research targeting physicians. We also found that this rate was 93.3% (28/30) when additional information was included.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Although adding additional information improves diagnostic accuracy, patient history remains a significant factor in AI-assisted medical diagnosis. Thus, when using AI in medical diagnosis, it is crucial to include pertinent and correct patient histories for an accurate diagnosis. Our findings emphasize the continued significance of patient history in clinical diagnoses in this age and highlight the need for its integration into AI-assisted medical diagnosis systems.</p></sec></abstract><kwd-group><kwd>medical diagnosis</kwd><kwd>ChatGPT</kwd><kwd>AI in medicine</kwd><kwd>diagnostic accuracy</kwd><kwd>patient history</kwd><kwd>medical history</kwd><kwd>artificial intelligence</kwd><kwd>AI</kwd><kwd>physical examination</kwd><kwd>physical examinations</kwd><kwd>laboratory investigation</kwd><kwd>laboratory investigations</kwd><kwd>mHealth</kwd><kwd>accuracy</kwd><kwd>public health</kwd><kwd>United States</kwd><kwd>AI diagnosis</kwd><kwd>treatment</kwd><kwd>male</kwd><kwd>female</kwd><kwd>child</kwd><kwd>children</kwd><kwd>youth</kwd><kwd>adolescent</kwd><kwd>adolescents</kwd><kwd>teen</kwd><kwd>teens</kwd><kwd>teenager</kwd><kwd>teenagers</kwd><kwd>older adult</kwd><kwd>older adults</kwd><kwd>elder</kwd><kwd>elderly</kwd><kwd>older person</kwd><kwd>older people</kwd><kwd>investigative</kwd><kwd>mobile health</kwd><kwd>digital health</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Over the past decade, medical knowledge and diagnostic techniques have expanded globally and have become more accessible with remarkable advancements in clinical testing and useful reference systems. Despite these advancements, misdiagnosis significantly contributes to mortality, making it a significant public health issue [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Studies have shown discrepancies between clinical and postmortem autopsy diagnoses in at least 25% of patients [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. One study suggests that approximately 40,500 adult patients in intensive care units in the United States die of misdiagnoses annually, and the predicted prevalence of potentially lethal misdiagnoses is 6.3% [<xref ref-type="bibr" rid="ref8">8</xref>]. Another report suggests that diagnostic errors contribute to approximately 10% of deaths and 6% to 17% of hospital adverse events, and are the leading cause of medical malpractice claims [<xref ref-type="bibr" rid="ref7">7</xref>]. Considering the operative characteristics of clinical investigations combined with the inherent variability in disease presentation, it is often challenging to diagnose patients correctly&#x2014;an issue that has concerned physicians perennially. Decades ago, a pivotal study proposed that patient history contributes to approximately 80% of the diagnostic process [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Medical history remains crucial for diagnosis [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>] and is vital in contemporary physicians&#x2019; clinical diagnoses.</p><p>With the advent of artificial intelligence (AI) in recent years, numerous studies have focused on AI-assisted diagnoses, including cancer screening and treatment [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>], diagnostic ultrasound imaging [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref19">19</xref>], x-ray imaging [<xref ref-type="bibr" rid="ref20">20</xref>], computed tomography [<xref ref-type="bibr" rid="ref21">21</xref>], magnetic resonance imaging [<xref ref-type="bibr" rid="ref22">22</xref>], and endoscopy [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. Other reports on AI-assisted imaging diagnoses include AI&#x2019;s applications in radiology, pathology, and dermatological imaging [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. There have also been reports on the use of AI in diagnosing specific conditions [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref27">27</xref>]. However, while several studies have reported that AI is useful in screening, diagnosing, and even treating certain medical conditions, to the best of our knowledge, no study has examined the importance of patient history in AI-assisted medical diagnosis. In addition, the extent to which AI considers patient history in its diagnostic processes remains to be fully understood.</p><p>This study aimed to investigate the importance of patient history in an AI-assisted medical diagnostic process aided by ChatGPT (version 4.0; June 2, 2023), one of the most well-known large language models that was released on March 14, 2023, to better understand the future of diagnostic medicine where AI is predicted to play an increasingly prominent role. Our study explored the contribution of patient history to AI-assisted medical diagnoses and assessed the accuracy of ChatGPT in reaching a clinical diagnosis based on the medical history that was provided. By reevaluating the significance of patient history, our study contributes to the ongoing discourse on optimizing diagnostic processes, both conventional and AI-assisted.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design, Settings, and Participants</title><p>In our study, we used some of the 45 standardized clinical vignettes in <italic>The BMJ</italic> (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) to evaluate the diagnostic and triage accuracy of web-based symptom checkers [<xref ref-type="bibr" rid="ref28">28</xref>]. These vignettes were published on June 5, 2015. They offer a balanced set of cases, with 15 cases requiring immediate attention, 15 cases requiring consultation but not immediately, and 15 cases not requiring immediate attention or consultation. They were identified from various clinical sources, including materials used to educate health professionals as well as a medical resource website, with content provided by a panel of physicians. Researchers have used these clinical vignettes to evaluate the usefulness of web-based symptom checkers and self-triage [<xref ref-type="bibr" rid="ref28">28</xref>-<xref ref-type="bibr" rid="ref31">31</xref>]. We chose these vignettes because of their varied severity levels, their origins from multiple resources rather than just 1 resource, and their credibility, having been used in prior studies. They also include some of the most commonly observed conditions in outpatient settings. Of the 45 cases, we selected those that included physical examination findings, test data, and medical history and provided a single distinct diagnosis. As illustrated in <xref ref-type="fig" rid="figure1">Figure 1</xref>, we excluded patients with no distinct diagnoses within the vignettes to serve as a reference (3 cases) and those who did not undergo any physical examination or laboratory tests (12 cases). Finally, the remaining 30 cases were used in this study.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Inclusion and exclusion criteria.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v10i1e52674_fig01.png"/></fig></sec><sec id="s2-2"><title>Data Collection and Measurements</title><p>We assigned the correct diagnosis for each of these 30 cases to &#x201C;Answer.&#x201D; We then used the AI model, ChatGPT, to generate 2 diagnoses: the first, labeled &#x201C;History,&#x201D; was obtained by inputting only the medical history into ChatGPT; the second set, labeled &#x201C;All,&#x201D; was produced by inputting the medical history and all the other additional information in the clinical vignettes. Each time ChatGPT was prompted to generate a diagnosis, a separate chat window was used (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). Thus, we used 2 chat windows for each case&#x2014;one for the &#x201C;History&#x201D; diagnosis and the other for the &#x201C;All&#x201D; diagnosis. Additionally, the patients&#x2019; information was not inputted incrementally.</p><p>The concordance rate was assessed among &#x201C;Answer,&#x201D; &#x201C;History,&#x201D; and &#x201C;All.&#x201D; To extract a diagnosis from ChatGPT, we ended each input session with the phrase &#x201C;What is the most likely diagnosis?&#x201D; For both the &#x201C;History&#x201D; and &#x201C;All,&#x201D; the session was deemed complete when the AI returned the single most likely diagnosis. If ChatGPT suggested multiple diagnoses or indicated that it did not provide the most likely diagnosis, we repeated the process under the same conditions for a maximum of 5 attempts. Cases for which a single diagnosis could not be obtained even after 5 attempts were excluded without making further attempts.</p></sec><sec id="s2-3"><title>Ethical Considerations</title><p>Our research does not involve humans, medical records, patient information, observations of public behaviors, or secondary data analyses; hence, it is exempt from ethical approval, the requirement of informed consent, and institutional review board approval. Additionally, as no identifying information was included, the data did not need to be anonymized or deidentified, and the need for compensation did not arise because no human participants were included in the study.</p></sec><sec id="s2-4"><title>Data Analysis</title><p>Three board-certified physicians working in a medical diagnostic department at our facility assessed the concordance among the 3 AI-proposed diagnoses (&#x201C;Answer,&#x201D; &#x201C;History,&#x201D; and &#x201C;All&#x201D;). Of the 3 physicians, 1 is general medicine board&#x2013;certified, 1 is internal medicine board&#x2013;certified, and 1 is internal medicine&#x2013;, general internal medicine&#x2013;, and family medicine board&#x2013;certified; their postgraduate education spanned 7, 9, and 11 years, respectively. A diagnosis was considered to match if at least 2 of the 3 physicians agreed upon the correspondence. Distinguishing between acute pharyngitis and acute upper respiratory tract infection necessitated determining whether to consider diseases resulting from similar pathologies as correct diagnoses. In contrast, for diseases that are essentially the same but have different nomenclatures, such as oral ulcers and canker sores, we considered them correct diagnoses.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>Among the 30 cases, 19 patients were male and 11 were female, with ages ranging from 18 months to 65 years. In total, 12 individuals were younger than 20 years.</p><p>The results are shown in <xref ref-type="table" rid="table1">Table 1</xref>. Cases 1-15 of the original vignette represent those requiring emergent care, cases 16-30 represent those requiring nonemergent care, and cases 31-45 represent those that are appropriate for self-care. A comparison with the correct diagnosis listed in <italic>The BMJ</italic> vignettes (labeled as &#x201C;Answer&#x201D;) showed that &#x201C;Answer&#x201D; and &#x201C;History&#x201D; coincided 76.6% of the time, while &#x201C;Answer&#x201D; and &#x201C;All&#x201D; had a concordance rate of 93.3%. Five (16.7%) patients could not be diagnosed on the basis of medical history alone but were diagnosed when additional information was provided. In 1 (3.3%) case, the diagnosis was different and incorrect under both conditions (&#x201C;History&#x201D; and &#x201C;All&#x201D;). In 1 (3.3%) case, the incorrect diagnosis was the same under both conditions (&#x201C;History&#x201D; and &#x201C;All&#x201D;).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>List of answers and diagnoses made by ChatGPT<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Case number of the original vignette</td><td align="left" valign="bottom">Original diagnosis (Answer)</td><td align="left" valign="bottom">Output from history only (History)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="bottom">Output from all information (All)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">1</td><td align="left" valign="top">Acute liver failure</td><td align="left" valign="top">Acute liver failure<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Acute liver failure<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">2</td><td align="left" valign="top">Appendicitis</td><td align="left" valign="top">Acute gastroenteritis</td><td align="left" valign="top">Acute peritonitis, possibly secondary to a ruptured appendix (perforated appendicitis)<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">5</td><td align="left" valign="top">Deep vein thrombosis</td><td align="left" valign="top">Deep vein thrombosis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Deep vein thrombosis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">6</td><td align="left" valign="top">Heart attack</td><td align="left" valign="top">Acute myocardial infarction<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Acute anterior wall myocardial infarction<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">7</td><td align="left" valign="top">Hemolytic uremic syndrome</td><td align="left" valign="top">Hemolytic uremic syndrome<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Hemolytic uremic syndrome<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">9</td><td align="left" valign="top">Malaria</td><td align="left" valign="top">Malaria<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Malaria<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">10</td><td align="left" valign="top">Meningitis</td><td align="left" valign="top">N/A<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup> &#x00D7; 5<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="top">Meningitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">11</td><td align="left" valign="top">Pneumonia</td><td align="left" valign="top">Community-acquired pneumonia<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Community-acquired pneumonia<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">12</td><td align="left" valign="top">Pulmonary embolism</td><td align="left" valign="top">Pulmonary embolism<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Pulmonary embolism<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">13</td><td align="left" valign="top">Rocky Mountain spotted fever</td><td align="left" valign="top">Tick-borne illness, such as Rocky Mountain spotted fever or ehrlichiosis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Rocky Mountain spotted fever<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">16</td><td align="left" valign="top">Acute otitis media</td><td align="left" valign="top">Viral upper respiratory tract infection</td><td align="left" valign="top">Acute otitis media<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">17</td><td align="left" valign="top">Acute pharyngitis</td><td align="left" valign="top">Strep throat<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Streptococcal pharyngitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">18</td><td align="left" valign="top">Acute pharyngitis</td><td align="left" valign="top">Streptococcal pharyngitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Streptococcal pharyngitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">19</td><td align="left" valign="top">Acute sinusitis</td><td align="left" valign="top">Acute sinusitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">N/A &#x00D7; 2<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup>; acute bacterial sinusitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">21</td><td align="left" valign="top">Cellulitis</td><td align="left" valign="top">N/A &#x00D7; 5</td><td align="left" valign="top">Cellulitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">24</td><td align="left" valign="top">Mononucleosis</td><td align="left" valign="top">Infectious mononucleosis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Infectious mononucleosis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">25</td><td align="left" valign="top">Peptic ulcer disease</td><td align="left" valign="top">Peptic ulcer disease<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Peptic ulcer disease<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">26</td><td align="left" valign="top">Pneumonia</td><td align="left" valign="top">Pneumonia<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Community-acquired pneumonia<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">27</td><td align="left" valign="top"><italic>Salmonella</italic> infection</td><td align="left" valign="top"><italic>Campylobacter jejuni</italic> infection</td><td align="left" valign="top">Acute gastroenteritis, likely due to food poisoning</td></tr><tr><td align="left" valign="top">30</td><td align="left" valign="top">Vertigo</td><td align="left" valign="top">Benign paroxysmal positional vertigo<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Benign paroxysmal positional vertigo<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">31</td><td align="left" valign="top">Acute bronchitis</td><td align="left" valign="top">Acute bronchitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Acute bronchitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">32</td><td align="left" valign="top">Acute bronchitis</td><td align="left" valign="top">Acute bronchitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Acute bronchitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">33</td><td align="left" valign="top">Acute conjunctivitis</td><td align="left" valign="top">Viral conjunctivitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Viral conjunctivitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">34</td><td align="left" valign="top">Acute pharyngitis</td><td align="left" valign="top">Viral upper respiratory tract infection</td><td align="left" valign="top">Upper respiratory tract infection</td></tr><tr><td align="left" valign="top">37</td><td align="left" valign="top">Bee sting without anaphylaxis</td><td align="left" valign="top">Pain of the sting</td><td align="left" valign="top">Localized allergic reaction to a bee sting<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">38</td><td align="left" valign="top">Canker sore</td><td align="left" valign="top">Recurrent aphthous stomatitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Recurrent aphthous stomatitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">39</td><td align="left" valign="top">Candida yeast infection</td><td align="left" valign="top">Vaginal candidiasis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Vulvovaginal candidiasis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">42</td><td align="left" valign="top">Stye</td><td align="left" valign="top">Hordeolum<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Hordeolum<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">43</td><td align="left" valign="top">Viral upper respiratory tract infection</td><td align="left" valign="top">Acute sinusitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Acute sinusitis<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr><tr><td align="left" valign="top">44</td><td align="left" valign="top">Viral upper respiratory tract infection</td><td align="left" valign="top">Common viral illness, such as the common cold or influenza<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">Viral upper respiratory tract infection<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>We repeated outputs until a single plausible diagnosis was made, with a maximum of 5 attempts.</p></fn><fn id="table1fn2"><p><sup>b</sup>Matching answers between Answer and History: 23/30 (76.6%); median trial count 1 (Q1 1, Q2 1, Q3 1).</p></fn><fn id="table1fn3"><p><sup>c</sup>Matching answers between History and All: 28/30 (93.3%); median trial count 1 (Q1 1, Q2 1, Q3 1).</p></fn><fn id="table1fn4"><p><sup>d</sup>The output matched with that of &#x201C;Answer.&#x201D;</p></fn><fn id="table1fn5"><p><sup>e</sup>N/A: not applicable.</p></fn><fn id="table1fn6"><p><sup>f</sup>We attempted to obtain a diagnosis 5 times but failed.</p></fn><fn id="table1fn7"><p><sup>g</sup>We attempted to obtain a diagnosis twice but failed.</p></fn></table-wrap-foot></table-wrap><p><xref ref-type="fig" rid="figure2">Figure 2</xref> presents details regarding the number of attempts required. On average, 1.27 attempts were needed for inputs involving only medical history followed by the question &#x201C;What is the most likely diagnosis?&#x201D; When all possible information, including physical examination findings and laboratory data, were inputted, followed by the same question, an average of 1.00 attempt was required. Regarding the 2 cases shown in <xref ref-type="fig" rid="figure2">Figure 2</xref> that required 5 attempts, ChatGPT was unable to narrow down the diagnosis to the single most likely option. Consequently, these cases were counted as mismatches with the correct diagnoses listed in <italic>The BMJ</italic> vignettes.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Data collection and measurements.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v10i1e52674_fig02.png"/></fig></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>Despite the advancements in medical knowledge and diagnostic techniques, misdiagnosis remains a significant issue. AI has shown promise in the diagnosis and treatment of medical conditions; however, there is limited understanding of how AI uses patient history for diagnostic purposes. Our study aimed to investigate the extent to which AI (ChatGPT) can use information from medical history to accurately diagnose common diseases, which are frequently encountered in general outpatient, emergency, and ward management settings. Although some studies have investigated the accuracy of AI-based medical diagnosis, our study is novel because it emphasizes the importance of patient history. We compared the diagnostic accuracy of diagnoses made on the basis of only patient history and those made using all the information; this makes our study unique. To the best of our knowledge, no previous research has been conducted on this topic.</p><p>Our study investigated the role of patient history in AI-assisted medical diagnoses using ChatGPT. We analyzed 30 standardized patient vignettes from <italic>The BMJ</italic> to assess the concordance rates between AI-proposed diagnoses based on medical history only and those based on both medical history and additional information. Our results showed high concordance rates of 76.6% between the &#x201C;Answer&#x201D; and &#x201C;History&#x201D; groups, suggesting the importance of patient history in AI-assisted diagnoses and highlighting the potential of AI in improving diagnostic accuracy. This result is similar to that of a previous study that involved actual physicians instead of ChatGPT [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>].</p><p>Characteristics of cases that did not lead to appropriate diagnoses based on history alone include, for instance, the following: an appendicitis case (case 2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) for which there was no documentation of pain migration in the medical history, a meningitis case (case 10 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) wherein only headache and fever were documented, an otitis media case (case 16 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) wherein only upper respiratory symptoms were recorded with no mention of ear-related symptoms, errors in identifying the causative agent in a case of acute gastroenteritis (case 27 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), and an acute pharyngitis case (case 34 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) that lacked the necessary medical history to determine the Centor score. Such omissions in the medical history could be considered contributing factors to the misdiagnoses. When physical findings and test data were added, an accurate diagnosis was achieved in 28 out of 30 cases (93.3%), showing a 16.7% increase in the accuracy rate. These two cases were of acute pharyngitis diagnosed as acute upper respiratory tract infection and <italic>Salmonella</italic> enteritis diagnosed as acute gastroenteritis. While we considered these incorrect diagnoses for the purpose of this study, they could have been deemed correct under certain criteria. Of the 7 cases that did not match between &#x201C;Answer&#x201D; and &#x201C;History,&#x201D; 6 were of infectious diseases (21 of 30 cases were of infectious diseases). These included cases where appendicitis was mistaken for acute gastroenteritis, acute otitis media and acute pharyngitis were mistaken for upper respiratory infections, and a <italic>Salmonella</italic> infection was mistaken for a <italic>Campylobacter</italic> infection. Physical examinations or tests may help identify the site of infection or pathogen in cases of intra-abdominal or head and neck infections.</p><p>There are situations in which physical examination and clinical test information may not be available in clinical settings. For instance, digital patient encounters owing to the impact of the COVID-19 pandemic often preclude physical examinations and clinical tests. The widespread use of telemedicine approaches in COVID-19 management, from screening to follow-up, has demonstrated the community&#x2019;s acceptance and interest in telehealth solutions [<xref ref-type="bibr" rid="ref32">32</xref>]. Moreover, even in face-to-face consultations, there are scenarios, such as in clinics, where detailed clinical tests may not be feasible depending on the setting. Furthermore, we cannot perform all physical examinations and tests on all patients. Therefore, we should consider potential differential diagnoses and decide which pertinent physical examinations or tests are the most suitable and should be performed. Most importantly, it has been reported that one rarely makes a correct diagnosis when one cannot make a differential diagnosis based on history [<xref ref-type="bibr" rid="ref11">11</xref>]. In addition, accurately predicting the diagnosis based on medical history is associated with a higher diagnostic accuracy of the physical examination, whereas incorrect prediction of the diagnosis based on medical history is associated with a lower diagnostic accuracy of the physical examination [<xref ref-type="bibr" rid="ref33">33</xref>]. Based on these findings and suggestions, medical diagnosis using ChatGPT is considered heavily dependent on history.</p><p>Using AI for diagnosis can enhance diagnostic accuracy by more efficiently collecting medical histories. For instance, diagnosing acute appendicitis is sometimes challenging. AI may face the same challenge as that observed when, in our study, AI mistakenly identified acute appendicitis as acute gastroenteritis. This misdiagnosis may have occurred because the case lacked specific medical histories characteristic of appendicitis, such as pain migration. By configuring AI systems to verify pain migration in patients with abdominal pain, especially for such common conditions, diagnostic precision may improve.</p><p>There are 2 possible limitations in our study. First, it remains unclear whether similar results could be obtained with other vignettes or actual patients. Unlike using preprovided vignettes, among which we included 30 cases, diagnosis can be more challenging in clinical settings because it requires taking a medical history from patients. We included 30 cases from among the vignettes, which include some of the most commonly observed conditions in the outpatient setting. Although covering all the existing conditions is not feasible, we do not know if the case volume in our study is sufficiently high. This study included relatively simple cases in which patients had very few comorbidities, potentially making the diagnosis less challenging. Moreover, patients with psychiatric conditions tend to present with complex and lengthy case histories, and the wording used by mental health clinicians may differ, be inconsistent, be vague, or fail to pinpoint a diagnosis. Our vignettes did not include a diagnosis of any mental illness. Due to the abovementioned reasons, our results may not apply to all clinical settings. Furthermore, when we consider what the patient reports, results may differ if languages other than English are used since ChatGPT does not recognize some languages, and each language may have its unique nuance. This highlights the importance of linguistic diversity and cultural context in AI applications, particularly in medical diagnoses where patient communication and history are critical. Future iterations of AI systems should aim to incorporate a broader range of languages and understand cultural nuances to ensure more accurate and inclusive diagnostic support. This idea is important in the context of health inequality. Furthermore, disparities in technology access may pose some challenges. Future research should address these barriers to ensure equitable access to AI-assisted diagnostic tools.</p><p>Second, we encountered cases where the input of medical history followed by the question, &#x201C;What is the most likely diagnosis?&#x201D; failed to yield a single most likely diagnosis even after 5 attempts, which could have introduced bias into our results, although we only had 2 such cases.</p><p>In the future, studies should focus on training AI by implementing evidence-based medical information, enabling it to present the underlying reasons and guidelines for diagnoses. In the event of a misdiagnosis, analyzing the process that led to the false diagnosis could be challenging in an AI-assisted medical diagnosis. Given the current situation where reflection on misdiagnoses is not always feasible, AI should be used as an auxiliary tool in medical diagnosis. This approach underscores the importance of AI, deeming it a support system rather than a definitive diagnostic solution. This area needs further investigation. Future studies should also verify our results with certain common conditions or diseases, such as the top 10 diseases identified in the Global Burden of Diseases study [<xref ref-type="bibr" rid="ref34">34</xref>], potentially leveraging the benefits and limitations of AI-assisted medical diagnosis.</p></sec><sec id="s4-2"><title>Conclusions</title><p>Relevant patient history is essential for AI-assisted diagnosis. The input of relevant patient history or the development of AI systems capable of obtaining comprehensive medical histories is vital for AI-assisted medical diagnosis. Furthermore, even in the modern era of advanced medical knowledge and clinical testing, the significance of patient history in diagnosis remains crucial.</p></sec></sec></body><back><notes><sec><title>Data Availability</title><p>All of our clinical vignettes, results, and prompts used are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec></notes><fn-group><fn fn-type="con"><p>FF conceptualized the study, designed the methodology, collected the data, and drafted the manuscript. YY, DY, and SU conceptualized the study, designed the methodology, and reviewed and edited the manuscript. SY, YL, KS, TT, KN, TU, and MI conceptualized the study and reviewed and edited the manuscript. No generative artificial intelligence was used in writing the manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Omron</surname><given-names>R</given-names></name><name name-style="western"><surname>Kotwal</surname><given-names>S</given-names></name><name name-style="western"><surname>Garibaldi</surname><given-names>BT</given-names></name><name name-style="western"><surname>Newman-Toker</surname><given-names>DE</given-names></name></person-group><article-title>The diagnostic performance feedback &#x201C;calibration gap&#x201D;: why clinical experience alone is not enough to prevent serious diagnostic errors</article-title><source>AEM Educ Train</source><year>2018</year><month>10</month><volume>2</volume><issue>4</issue><fpage>339</fpage><lpage>342</lpage><pub-id pub-id-type="doi">10.1002/aet2.10119</pub-id><pub-id pub-id-type="medline">30386846</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="book"><person-group person-group-type="author"><collab>Committee on Diagnostic Error in Health Care</collab><collab>Board on Health Care Services</collab><collab>Institute of Medicine</collab><collab>The National Academies of Sciences, Engineering, and Medicine</collab></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Balogh</surname><given-names>EP</given-names></name><name name-style="western"><surname>Miller</surname><given-names>BT</given-names></name><name name-style="western"><surname>Ball</surname><given-names>JR</given-names></name></person-group><source>Improving Diagnosis in Health Care</source><year>2015</year><publisher-name>National Academies Press</publisher-name><pub-id pub-id-type="other">9780309377720</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Friberg</surname><given-names>N</given-names></name><name name-style="western"><surname>Ljungberg</surname><given-names>O</given-names></name><name name-style="western"><surname>Berglund</surname><given-names>E</given-names></name><etal/></person-group><article-title>Cause of death and significant disease found at autopsy</article-title><source>Virchows Arch</source><year>2019</year><month>12</month><volume>475</volume><issue>6</issue><fpage>781</fpage><lpage>788</lpage><pub-id pub-id-type="doi">10.1007/s00428-019-02672-z</pub-id><pub-id pub-id-type="medline">31691009</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shojania</surname><given-names>KG</given-names></name><name name-style="western"><surname>Burton</surname><given-names>EC</given-names></name><name name-style="western"><surname>McDonald</surname><given-names>KM</given-names></name><name name-style="western"><surname>Goldman</surname><given-names>L</given-names></name></person-group><article-title>Changes in rates of autopsy-detected diagnostic errors over time: a systematic review</article-title><source>JAMA</source><year>2003</year><month>06</month><day>4</day><volume>289</volume><issue>21</issue><fpage>2849</fpage><lpage>2856</lpage><pub-id pub-id-type="doi">10.1001/jama.289.21.2849</pub-id><pub-id pub-id-type="medline">12783916</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schmitt</surname><given-names>BP</given-names></name><name name-style="western"><surname>Kushner</surname><given-names>MS</given-names></name><name name-style="western"><surname>Wiener</surname><given-names>SL</given-names></name></person-group><article-title>The diagnostic usefulness of the history of the patient with dyspnea</article-title><source>J Gen Intern Med</source><year>1986</year><volume>1</volume><issue>6</issue><fpage>386</fpage><lpage>393</lpage><pub-id pub-id-type="doi">10.1007/BF02596424</pub-id><pub-id pub-id-type="medline">3794838</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kuijpers</surname><given-names>C</given-names></name><name name-style="western"><surname>Fronczek</surname><given-names>J</given-names></name><name name-style="western"><surname>van de Goot</surname><given-names>FRW</given-names></name><name name-style="western"><surname>Niessen</surname><given-names>HWM</given-names></name><name name-style="western"><surname>van Diest</surname><given-names>PJ</given-names></name><name name-style="western"><surname>Jiwa</surname><given-names>M</given-names></name></person-group><article-title>The value of autopsies in the era of high-tech medicine: discrepant findings persist</article-title><source>J Clin Pathol</source><year>2014</year><month>06</month><volume>67</volume><issue>6</issue><fpage>512</fpage><lpage>519</lpage><pub-id pub-id-type="doi">10.1136/jclinpath-2013-202122</pub-id><pub-id pub-id-type="medline">24596140</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ball</surname><given-names>JR</given-names></name><name name-style="western"><surname>Balogh</surname><given-names>E</given-names></name></person-group><article-title>Improving diagnosis in health care: highlights of a report from the National Academies of Sciences, Engineering, and Medicine</article-title><source>Ann Intern Med</source><year>2016</year><month>01</month><day>5</day><volume>164</volume><issue>1</issue><fpage>59</fpage><lpage>61</lpage><pub-id pub-id-type="doi">10.7326/M15-2256</pub-id><pub-id pub-id-type="medline">26414299</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Winters</surname><given-names>B</given-names></name><name name-style="western"><surname>Custer</surname><given-names>J</given-names></name><name name-style="western"><surname>Galvagno</surname><given-names>SM</given-names></name><etal/></person-group><article-title>Diagnostic errors in the intensive care unit: a systematic review of autopsy studies</article-title><source>BMJ Qual Saf</source><year>2012</year><month>11</month><volume>21</volume><issue>11</issue><fpage>894</fpage><lpage>902</lpage><pub-id pub-id-type="doi">10.1136/bmjqs-2012-000803</pub-id><pub-id pub-id-type="medline">22822241</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hampton</surname><given-names>JR</given-names></name><name name-style="western"><surname>Harrison</surname><given-names>MJ</given-names></name><name name-style="western"><surname>Mitchell</surname><given-names>JR</given-names></name><name name-style="western"><surname>Prichard</surname><given-names>JS</given-names></name><name name-style="western"><surname>Seymour</surname><given-names>C</given-names></name></person-group><article-title>Relative contributions of history-taking, physical examination, and laboratory investigation to diagnosis and management of medical outpatients</article-title><source>Br Med J</source><year>1975</year><month>05</month><day>31</day><volume>2</volume><issue>5969</issue><fpage>486</fpage><lpage>489</lpage><pub-id pub-id-type="doi">10.1136/bmj.2.5969.486</pub-id><pub-id pub-id-type="medline">1148666</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Peterson</surname><given-names>MC</given-names></name><name name-style="western"><surname>Holbrook</surname><given-names>JM</given-names></name><name name-style="western"><surname>Hales</surname><given-names>DV</given-names></name><name name-style="western"><surname>Smith</surname><given-names>NL</given-names></name><name name-style="western"><surname>Staker</surname><given-names>LV</given-names></name></person-group><article-title>Contributions of the history, physical examination, and laboratory investigation in making medical diagnoses</article-title><source>Obstet Gynecol Surv</source><year>1992</year><month>10</month><volume>47</volume><issue>10</issue><fpage>711</fpage><lpage>712</lpage><pub-id pub-id-type="doi">10.1097/00006254-199210000-00013</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gruppen</surname><given-names>LD</given-names></name><name name-style="western"><surname>Palchik</surname><given-names>NS</given-names></name><name name-style="western"><surname>Wolf</surname><given-names>FM</given-names></name><name name-style="western"><surname>Laing</surname><given-names>TJ</given-names></name><name name-style="western"><surname>Oh</surname><given-names>MS</given-names></name><name name-style="western"><surname>Davis</surname><given-names>WK</given-names></name></person-group><article-title>Medical student use of history and physical information in diagnostic reasoning</article-title><source>Arthritis Care Res</source><year>1993</year><month>06</month><volume>6</volume><issue>2</issue><fpage>64</fpage><lpage>70</lpage><pub-id pub-id-type="doi">10.1002/art.1790060204</pub-id><pub-id pub-id-type="medline">8399428</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tsukamoto</surname><given-names>T</given-names></name><name name-style="western"><surname>Ohira</surname><given-names>Y</given-names></name><name name-style="western"><surname>Noda</surname><given-names>K</given-names></name><name name-style="western"><surname>Takada</surname><given-names>T</given-names></name><name name-style="western"><surname>Ikusaka</surname><given-names>M</given-names></name></person-group><article-title>The contribution of the medical history for the diagnosis of simulated cases by medical students</article-title><source>Int J Med Educ</source><year>2012</year><month>04</month><volume>3</volume><fpage>78</fpage><lpage>82</lpage><pub-id pub-id-type="doi">10.5116/ijme.4f8a.e48c</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>ZH</given-names></name><name name-style="western"><surname>Lin</surname><given-names>L</given-names></name><name name-style="western"><surname>Wu</surname><given-names>CF</given-names></name><name name-style="western"><surname>Li</surname><given-names>CF</given-names></name><name name-style="western"><surname>Xu</surname><given-names>RH</given-names></name><name name-style="western"><surname>Sun</surname><given-names>Y</given-names></name></person-group><article-title>Artificial intelligence for assisting cancer diagnosis and treatment in the era of precision medicine</article-title><source>Cancer Commun (Lond)</source><year>2021</year><month>11</month><volume>41</volume><issue>11</issue><fpage>1100</fpage><lpage>1115</lpage><pub-id pub-id-type="doi">10.1002/cac2.12215</pub-id><pub-id pub-id-type="medline">34613667</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mitsala</surname><given-names>A</given-names></name><name name-style="western"><surname>Tsalikidis</surname><given-names>C</given-names></name><name name-style="western"><surname>Pitiakoudis</surname><given-names>M</given-names></name><name name-style="western"><surname>Simopoulos</surname><given-names>C</given-names></name><name name-style="western"><surname>Tsaroucha</surname><given-names>AK</given-names></name></person-group><article-title>Artificial intelligence in colorectal cancer screening, diagnosis and treatment. A new era</article-title><source>Curr Oncol</source><year>2021</year><month>04</month><day>23</day><volume>28</volume><issue>3</issue><fpage>1581</fpage><lpage>1607</lpage><pub-id pub-id-type="doi">10.3390/curroncol28030149</pub-id><pub-id pub-id-type="medline">33922402</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ochiai</surname><given-names>K</given-names></name><name name-style="western"><surname>Ozawa</surname><given-names>T</given-names></name><name name-style="western"><surname>Shibata</surname><given-names>J</given-names></name><name name-style="western"><surname>Ishihara</surname><given-names>S</given-names></name><name name-style="western"><surname>Tada</surname><given-names>T</given-names></name></person-group><article-title>Current status of artificial intelligence-based computer-assisted diagnosis systems for gastric cancer in endoscopy</article-title><source>Diagnostics (Basel)</source><year>2022</year><month>12</month><day>13</day><volume>12</volume><issue>12</issue><fpage>3153</fpage><pub-id pub-id-type="doi">10.3390/diagnostics12123153</pub-id><pub-id pub-id-type="medline">36553160</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Calisto</surname><given-names>FM</given-names></name><name name-style="western"><surname>Santiago</surname><given-names>C</given-names></name><name name-style="western"><surname>Nunes</surname><given-names>N</given-names></name><name name-style="western"><surname>Nascimento</surname><given-names>JC</given-names></name></person-group><article-title>Breastscreening-AI: evaluating medical intelligent agents for human-AI interactions</article-title><source>Artif Intell Med</source><year>2022</year><month>05</month><volume>127</volume><fpage>102285</fpage><pub-id pub-id-type="doi">10.1016/j.artmed.2022.102285</pub-id><pub-id pub-id-type="medline">35430044</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>LQ</given-names></name><name name-style="western"><surname>Wang</surname><given-names>JY</given-names></name><name name-style="western"><surname>Yu</surname><given-names>SY</given-names></name><etal/></person-group><article-title>Artificial intelligence in medical imaging of the liver</article-title><source>World J Gastroenterol</source><year>2019</year><month>02</month><day>14</day><volume>25</volume><issue>6</issue><fpage>672</fpage><lpage>682</lpage><pub-id pub-id-type="doi">10.3748/wjg.v25.i6.672</pub-id><pub-id pub-id-type="medline">30783371</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Peng</surname><given-names>S</given-names></name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names></name><name name-style="western"><surname>Lv</surname><given-names>W</given-names></name><etal/></person-group><article-title>Deep learning-based artificial intelligence model to assist thyroid nodule diagnosis and management: a multicentre diagnostic study</article-title><source>Lancet Digit Health</source><year>2021</year><month>04</month><volume>3</volume><issue>4</issue><fpage>e250</fpage><lpage>e259</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(21)00041-8</pub-id><pub-id pub-id-type="medline">33766289</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Drukker</surname><given-names>L</given-names></name><name name-style="western"><surname>Noble</surname><given-names>JA</given-names></name><name name-style="western"><surname>Papageorghiou</surname><given-names>AT</given-names></name></person-group><article-title>Introduction to artificial intelligence in ultrasound imaging in obstetrics and gynecology</article-title><source>Ultrasound Obstet Gynecol</source><year>2020</year><month>10</month><volume>56</volume><issue>4</issue><fpage>498</fpage><lpage>505</lpage><pub-id pub-id-type="doi">10.1002/uog.22122</pub-id><pub-id pub-id-type="medline">32530098</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guermazi</surname><given-names>A</given-names></name><name name-style="western"><surname>Tannoury</surname><given-names>C</given-names></name><name name-style="western"><surname>Kompel</surname><given-names>AJ</given-names></name><etal/></person-group><article-title>Improving radiographic fracture recognition performance and efficiency using artificial intelligence</article-title><source>Radiology</source><year>2022</year><month>03</month><volume>302</volume><issue>3</issue><fpage>627</fpage><lpage>636</lpage><pub-id pub-id-type="doi">10.1148/radiol.210937</pub-id><pub-id pub-id-type="medline">34931859</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>K</given-names></name><name name-style="western"><surname>Liu</surname><given-names>X</given-names></name><name name-style="western"><surname>Shen</surname><given-names>J</given-names></name><etal/></person-group><article-title>Clinically applicable AI system for accurate diagnosis, quantitative measurements, and prognosis of COVID-19 pneumonia using computed tomography</article-title><source>Cell</source><year>2020</year><month>06</month><day>11</day><volume>181</volume><issue>6</issue><fpage>1423</fpage><lpage>1433</lpage><pub-id pub-id-type="doi">10.1016/j.cell.2020.04.045</pub-id><pub-id pub-id-type="medline">32416069</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gore</surname><given-names>JC</given-names></name></person-group><article-title>Artificial intelligence in medical imaging</article-title><source>Magn Reson Imaging</source><year>2020</year><month>05</month><volume>68</volume><fpage>A1</fpage><lpage>A4</lpage><pub-id pub-id-type="doi">10.1016/j.mri.2019.12.006</pub-id><pub-id pub-id-type="medline">31857130</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Okagawa</surname><given-names>Y</given-names></name><name name-style="western"><surname>Abe</surname><given-names>S</given-names></name><name name-style="western"><surname>Yamada</surname><given-names>M</given-names></name><name name-style="western"><surname>Oda</surname><given-names>I</given-names></name><name name-style="western"><surname>Saito</surname><given-names>Y</given-names></name></person-group><article-title>Artificial intelligence in endoscopy</article-title><source>Dig Dis Sci</source><year>2022</year><month>05</month><volume>67</volume><issue>5</issue><fpage>1553</fpage><lpage>1572</lpage><pub-id pub-id-type="doi">10.1007/s10620-021-07086-z</pub-id><pub-id pub-id-type="medline">34155567</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ramesh</surname><given-names>AN</given-names></name><name name-style="western"><surname>Kambhampati</surname><given-names>C</given-names></name><name name-style="western"><surname>Monson</surname><given-names>JRT</given-names></name><name name-style="western"><surname>Drew</surname><given-names>PJ</given-names></name></person-group><article-title>Artificial intelligence in medicine</article-title><source>Ann R Coll Surg Engl</source><year>2004</year><month>09</month><volume>86</volume><issue>5</issue><fpage>334</fpage><lpage>338</lpage><pub-id pub-id-type="doi">10.1308/147870804290</pub-id><pub-id pub-id-type="medline">15333167</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Revilla-Le&#x00F3;n</surname><given-names>M</given-names></name><name name-style="western"><surname>G&#x00F3;mez-Polo</surname><given-names>M</given-names></name><name name-style="western"><surname>Barmak</surname><given-names>AB</given-names></name><etal/></person-group><article-title>Artificial intelligence models for diagnosing gingivitis and periodontal disease: a systematic review</article-title><source>J Prosthet Dent</source><year>2023</year><month>12</month><volume>130</volume><issue>6</issue><fpage>816</fpage><lpage>824</lpage><pub-id pub-id-type="doi">10.1016/j.prosdent.2022.01.026</pub-id><pub-id pub-id-type="medline">35300850</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chung</surname><given-names>H</given-names></name><name name-style="western"><surname>Jo</surname><given-names>Y</given-names></name><name name-style="western"><surname>Ryu</surname><given-names>D</given-names></name><name name-style="western"><surname>Jeong</surname><given-names>C</given-names></name><name name-style="western"><surname>Choe</surname><given-names>SK</given-names></name><name name-style="western"><surname>Lee</surname><given-names>J</given-names></name></person-group><article-title>Artificial-intelligence-driven discovery of prognostic biomarker for sarcopenia</article-title><source>J Cachexia Sarcopenia Muscle</source><year>2021</year><month>12</month><volume>12</volume><issue>6</issue><fpage>2220</fpage><lpage>2230</lpage><pub-id pub-id-type="doi">10.1002/jcsm.12840</pub-id><pub-id pub-id-type="medline">34704369</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Uzun Ozsahin</surname><given-names>D</given-names></name><name name-style="western"><surname>Ozgocmen</surname><given-names>C</given-names></name><name name-style="western"><surname>Balcioglu</surname><given-names>O</given-names></name><name name-style="western"><surname>Ozsahin</surname><given-names>I</given-names></name><name name-style="western"><surname>Uzun</surname><given-names>B</given-names></name></person-group><article-title>Diagnostic AI and cardiac diseases</article-title><source>Diagnostics (Basel)</source><year>2022</year><month>11</month><day>22</day><volume>12</volume><issue>12</issue><fpage>2901</fpage><pub-id pub-id-type="doi">10.3390/diagnostics12122901</pub-id><pub-id pub-id-type="medline">36552908</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Semigran</surname><given-names>HL</given-names></name><name name-style="western"><surname>Linder</surname><given-names>JA</given-names></name><name name-style="western"><surname>Gidengil</surname><given-names>C</given-names></name><name name-style="western"><surname>Mehrotra</surname><given-names>A</given-names></name></person-group><article-title>Evaluation of symptom checkers for self diagnosis and triage: audit study</article-title><source>BMJ</source><year>2015</year><month>07</month><day>8</day><volume>351</volume><fpage>h3480</fpage><pub-id pub-id-type="doi">10.1136/bmj.h3480</pub-id><pub-id pub-id-type="medline">26157077</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>North</surname><given-names>F</given-names></name><name name-style="western"><surname>Jensen</surname><given-names>TB</given-names></name><name name-style="western"><surname>Stroebel</surname><given-names>RJ</given-names></name><etal/></person-group><article-title>Self-triage use, subsequent healthcare utilization, and diagnoses: a retrospective study of process and clinical outcomes following self-triage and self-scheduling for ear or hearing symptoms</article-title><source>Health Serv Res Manag Epidemiol</source><year>2023</year><volume>10</volume><fpage>23333928231168121</fpage><pub-id pub-id-type="doi">10.1177/23333928231168121</pub-id><pub-id pub-id-type="medline">37101803</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Riboli-Sasco</surname><given-names>E</given-names></name><name name-style="western"><surname>El-Osta</surname><given-names>A</given-names></name><name name-style="western"><surname>Alaa</surname><given-names>A</given-names></name><etal/></person-group><article-title>Triage and diagnostic accuracy of online symptom checkers: systematic review</article-title><source>J Med Internet Res</source><year>2023</year><month>06</month><day>2</day><volume>25</volume><fpage>e43803</fpage><pub-id pub-id-type="doi">10.2196/43803</pub-id><pub-id pub-id-type="medline">37266983</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Radionova</surname><given-names>N</given-names></name><name name-style="western"><surname>&#x00D6;g</surname><given-names>E</given-names></name><name name-style="western"><surname>Wetzel</surname><given-names>AJ</given-names></name><name name-style="western"><surname>Rieger</surname><given-names>MA</given-names></name><name name-style="western"><surname>Preiser</surname><given-names>C</given-names></name></person-group><article-title>Impacts of symptom checkers for laypersons&#x2019; self-diagnosis on physicians in primary care: scoping review</article-title><source>J Med Internet Res</source><year>2023</year><month>05</month><day>29</day><volume>25</volume><fpage>e39219</fpage><pub-id pub-id-type="doi">10.2196/39219</pub-id><pub-id pub-id-type="medline">37247214</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khoshrounejad</surname><given-names>F</given-names></name><name name-style="western"><surname>Hamednia</surname><given-names>M</given-names></name><name name-style="western"><surname>Mehrjerd</surname><given-names>A</given-names></name><etal/></person-group><article-title>Telehealth-based services during the COVID-19 pandemic: a systematic review of features and challenges</article-title><source>Front Public Health</source><year>2021</year><volume>9</volume><fpage>711762</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2021.711762</pub-id><pub-id pub-id-type="medline">34350154</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shikino</surname><given-names>K</given-names></name><name name-style="western"><surname>Ikusaka</surname><given-names>M</given-names></name><name name-style="western"><surname>Ohira</surname><given-names>Y</given-names></name><etal/></person-group><article-title>Influence of predicting the diagnosis from history on the accuracy of physical examination</article-title><source>Adv Med Educ Pract</source><year>2015</year><volume>6</volume><fpage>143</fpage><lpage>148</lpage><pub-id pub-id-type="doi">10.2147/AMEP.S77315</pub-id><pub-id pub-id-type="medline">25759604</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>GBD 2019 Diseases and Injuries Collaborators</collab></person-group><article-title>Global burden of 369 diseases and injuries in 204 countries and territories, 1990-2019: a systematic analysis for the Global Burden of Disease Study 2019</article-title><source>Lancet</source><year>2020</year><month>10</month><day>17</day><volume>396</volume><issue>10258</issue><fpage>1204</fpage><lpage>1222</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(20)30925-9</pub-id><pub-id pub-id-type="medline">33069326</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Clinical Vignettes used in our study.</p><media xlink:href="mededu_v10i1e52674_app1.pdf" xlink:title="PDF File, 159 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Explanation of the prompts we used in our study.</p><media xlink:href="mededu_v10i1e52674_app2.pdf" xlink:title="PDF File, 48 KB"/></supplementary-material></app-group></back></article>