<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Med Educ</journal-id><journal-id journal-id-type="publisher-id">mededu</journal-id><journal-id journal-id-type="index">20</journal-id><journal-title>JMIR Medical Education</journal-title><abbrev-journal-title>JMIR Med Educ</abbrev-journal-title><issn pub-type="epub">2369-3762</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v11i1e82326</article-id><article-id pub-id-type="doi">10.2196/82326</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Quantifying Emergency Medicine Residency Learning Curves Using Natural Language Processing: Retrospective Cohort Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Preiksaitis</surname><given-names>Carl</given-names></name><degrees>MD, MEd</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Hughes</surname><given-names>Joshua</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kabeer</surname><given-names>Rana</given-names></name><degrees>MD, MPH</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Dixon</surname><given-names>William</given-names></name><degrees>MD, MSED</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Rose</surname><given-names>Christian</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1"/></contrib></contrib-group><aff id="aff1"><institution>Department of Emergency Medicine, Stanford University School of Medicine</institution><addr-line>900 Welch Road, Suite 350</addr-line><addr-line>Palo Alto</addr-line><addr-line>CA</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Pellegrino</surname><given-names>Raffaele</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Chartash</surname><given-names>David</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Yao</surname><given-names>Li-Hung</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Carl Preiksaitis, MD, MEd, Department of Emergency Medicine, Stanford University School of Medicine, 900 Welch Road, Suite 350, Palo Alto, CA, 94304, United States, 1 650-723-6576, 1 650-723-0121; <email>cpreiksaitis@stanford.edu</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>9</day><month>12</month><year>2025</year></pub-date><volume>11</volume><elocation-id>e82326</elocation-id><history><date date-type="received"><day>13</day><month>08</month><year>2025</year></date><date date-type="rev-recd"><day>10</day><month>10</month><year>2025</year></date><date date-type="accepted"><day>09</day><month>11</month><year>2025</year></date></history><copyright-statement>&#x00A9; Carl Preiksaitis, Joshua Hughes, Rana Kabeer, William Dixon, Christian Rose. Originally published in JMIR Medical Education (<ext-link ext-link-type="uri" xlink:href="https://mededu.jmir.org">https://mededu.jmir.org</ext-link>), 9.12.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Education, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://mededu.jmir.org/">https://mededu.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://mededu.jmir.org/2025/1/e82326"/><abstract><sec><title>Background</title><p>The optimal duration of emergency medicine (EM) residency training remains a subject of national debate, with the Accreditation Council for Graduate Medical Education considering standardizing all programs to 4 years. However, empirical data on how residents accumulate clinical exposure over time are limited. Traditional measures, such as case logs and diagnostic codes, often fail to capture the breadth and depth of diagnostic reasoning. Natural language processing (NLP) of clinical documentation offers a novel approach to quantifying clinical experiences more comprehensively.</p></sec><sec><title>Objective</title><p>This study aimed to (1) quantify how EM residents acquire clinical topic exposure over the course of training, (2) evaluate variation in exposure patterns across residents and classes, and (3) assess changes in workload and case complexity over time to inform the discussion on optimal program length.</p></sec><sec sec-type="methods"><title>Methods</title><p>We conducted a retrospective cohort study of EM residents at Stanford Hospital, analyzing 244,255 emergency department encounters from July 1, 2016, to November 30, 2023. The sample included 62 residents across 4 graduating classes (2020&#x2010;2023), representing all primary training site encounters where residents served as primary or supervisory providers. Using a retrieval-augmented generation NLP pipeline, we mapped resident clinical documentation to the 895 subcategories of the 2022 Model for Clinical Practice of Emergency Medicine (MCPEM) via intermediate mapping to the Systematized Nomenclature of Medicine, Clinical Terms, Clinical Observations, Recordings, and Encoding problem list subset. We generated cumulative topic exposure curves, quantified the diversity of topic coverage, assessed variability between residents, and analyzed the progression in clinical complexity using Emergency Severity Index (ESI) scores and admission rates.</p></sec><sec sec-type="results"><title>Results</title><p>Residents encountered the largest increase in new topics during postgraduate year 1 (PGY1), averaging 376.7 (42.1%) unique topics among a total of 895 MCPEM subcategories. By PGY4, they averaged 565.9 (63.2%) topics, representing a 9.9% (51/515) increase over PGY3. Exposure plateaus generally occurred at 39 to 41 months, although substantial individual variation was observed, with some residents continuing to acquire new topics until graduation. Annual case volume more than tripled from PGY1 (mean 445.7, SD 112.7 encounters) to PGY4 (mean 1528.4, SD 112.7 encounters). Case complexity increased, as evidenced by a decrease in mean ESI score from 2.94 to 2.79, and a rise in high-acuity (ESI 1&#x2010;2) cases from 16% (4374/27,340) to 30.9% (9418/30,466).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>NLP analysis of clinical documentation provides a scalable, detailed method for tracking EM residents&#x2019; clinical exposure and progression. Many residents continue to gain new experiences into their fourth year, particularly in higher-acuity cases. These findings suggest that a 4-year training model may offer meaningful additional educational value, while also highlighting the importance of individualized assessment given the variability in learning trajectories.</p></sec></abstract><kwd-group><kwd>emergency medicine residency</kwd><kwd>clinical exposure</kwd><kwd>learning curves</kwd><kwd>natural language processing</kwd><kwd>electronic health records</kwd><kwd>graduate medical education</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>The Challenge of Measuring Clinical Experience</title><p>The optimal duration of emergency medicine (EM) residency training remains a critical unresolved question in graduate medical education. As the Accreditation Council for Graduate Medical Education considers standardizing all programs to a 4-year model, this debate has highlighted a fundamental gap in our understanding. We lack reliable methods to measure how residents accumulate and master clinical experience across a vast spectrum of EM presentations [<xref ref-type="bibr" rid="ref1">1</xref>]. While these clinical encounters form the foundation of physician development and shape future practice patterns, programs have struggled to systematically track and optimize them, even within competency-based educational frameworks [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>Current methods for measuring clinical exposure in EM suffer from both practical and conceptual limitations. Self-reported case logs, the traditional standard, demonstrate significant error rates due to recall bias [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Approaches using diagnostic coding systems such as the International Classification of Diseases, 10th revision, fundamentally misalign with EM&#x2019;s paradigm [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. The core work of emergency physicians, evaluating and ruling out life-threatening conditions, often results in nonspecific final diagnoses (eg, &#x201C;abdominal pain&#x201D;) that mask the complexity of care delivered [<xref ref-type="bibr" rid="ref12">12</xref>]. Furthermore, we know that evaluating for life-threatening illnesses within the context of abdominal pain can be confounded by mimics such as acute coronary syndrome, which are nonspecific, have a high overlap with other conditions, and while they are considered, may not appear in the final diagnosis but nonetheless expose the resident to evaluating for that condition.</p></sec><sec id="s1-2"><title>A Novel Natural Language Processing&#x2013;Based Approach</title><p>Natural language processing (NLP) of clinical documentation offers a potential breakthrough. By analyzing the comprehensive narrative content of clinical notes that capture the diagnostic reasoning process, NLP can measure case exposure with greater granularity. When combined with the Systematized Nomenclature of Medicine&#x2013;Clinical Terms, a clinical terminology system designed to represent complex medical concepts, this approach can systematically document both the breadth of conditions evaluated and the depth of clinical reasoning used. This methodological advance aligns with emerging calls for &#x201C;precision education&#x201D; in medical training, where the analysis of clinical data drives personalized learning optimization [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p></sec><sec id="s1-3"><title>Study Objectives</title><p>In this study, we used NLP to provide a comprehensive, data-driven analysis of EM resident development. Using electronic health record data from a single academic medical center spanning multiple resident cohorts, we pursued three objectives: (1) quantify topic exposure curves and clinical progression, mapping how residents accumulate diagnostic topic exposure over time; (2) examine variation in clinical exposure patterns between individual residents and graduating classes; and (3) analyze the distribution of clinical experiences across presentation types and complexity levels to provide empirical evidence relevant to the debate on optimal training duration.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design and Population</title><p>We conducted a retrospective analysis of emergency department (ED) encounters at Stanford Hospital between July 1, 2016, and November 30, 2023. Stanford Hospital serves as the primary training site for our residency and is a high-volume academic ED and level 1 trauma center. This period captured the primary training site experiences of 4 resident classes (2020&#x2010;2023). The study included all EM residents who completed their full 4-year training during this period (n=62). The resident cohort had a mean age of 29.0 (SD 3.6) years, and 40 (64.5%) residents were male. The cohort was predominantly White (n=49, 79%) and non-Hispanic (n=60, 96.8%), with other racial identities including Asian (n=11, 17.7%), Black (n=1, 1.6%), and other (n=1, 1.6%). Encounters in which residents served as either the primary or supervisory resident were included. Resident-patient encounters were identified using the electronic health record&#x2019;s treatment team data. A rule-based algorithm was developed to attribute each encounter to the appropriate residents. Primary attribution was assigned to the first resident to document their involvement with a patient, and this was cross-referenced with shift schedule data to ensure that the encounter occurred during the resident&#x2019;s clinical duties. To account for both primary and supervisory roles, encounters were also coattributed to a senior resident if they were documented on the treatment team in close temporal proximity to a junior resident, reflecting an active supervisory role. When both junior and senior residents were assigned to an encounter, we credited topic exposure to both residents for resident-level analysis but counted each encounter once for patient and encounter-level summaries; per&#x2013;postgraduate year (PGY) proportions used denominators based on unique, non-double-counted encounters. Encounters from nonclinical or administrative shifts were excluded. Our program is a 4-year PGY1 to 4 program where the PGY4 year includes 40 weeks of ED time with a specific emphasis on developing supervisory skills and practicing with graduated responsibility.</p><p>Residents also gain clinical experience at 2 high-volume, high-acuity affiliated sites (Kaiser Santa Clara and Santa Clara Valley Medical Center) that use a different electronic health record. These data were not included in our analysis. Depending on the PGY level, these external sites constitute approximately 30% to 35% of a resident&#x2019;s total ED training time. Encounters from off-service rotations (eg, intensive care unit, anesthesia, and obstetrics) were also excluded. Residents who did not complete the program were excluded from this analysis to ensure the integrity of longitudinal exposure curve construction.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>This study was approved as minimal-risk research by the Stanford University Institutional Review Board (IRB 69107). A waiver of informed consent was granted because the study involved secondary analysis of existing clinical documentation. Data access was authorized through the Stanford Research Repository. All data were deidentified and analyzed within a secure, Health Insurance Portability and Accountability Act&#x2013;compliant environment, and no identifiable information left the repository. The study complied with institutional and national regulations for human participants research.</p></sec><sec id="s2-3"><title>Data Sources and Variables</title><p>We extracted deidentified structured data, including patient demographics, Emergency Severity Index (ESI), and disposition status, as well as unstructured data in the form of clinical documentation from the Stanford Research Repository [<xref ref-type="bibr" rid="ref14">14</xref>]. We focused on note sections capturing resident diagnostic reasoning&#x2014;history of present illness, medical decision-making, and ED course narratives.</p></sec><sec id="s2-4"><title>NLP Overview</title><p>We developed a multistage NLP pipeline to map the narrative content of resident clinical documentation to the 895 clinical subcategories of the 2022 Model for Clinical Practice of Emergency Medicine (MCPEM) [<xref ref-type="bibr" rid="ref15">15</xref>]. Our approach used a retrieval-augmented generation framework with a Health Insurance Portability and Accountability Act&#x2013;compliant instance of Google&#x2019;s Gemini 1.5 Flash large language model, which was selected for its balance of cost-effectiveness and high performance within our institution&#x2019;s available tools [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. This involved extracting key clinical concepts from resident notes and mapping them, as an intermediate step, to the Systematized Nomenclature of Medicine&#x2013;Clinical Terms, Clinical Observations, Recordings, and Encoding subset before final classification into MCPEM topics [<xref ref-type="bibr" rid="ref19">19</xref>]. This 2-stage process was chosen to preserve granular clinical detail while using a standardized clinical terminology.</p><p>Our retrieval-augmented pipeline can be conceptualized using standard NLP terminology as a 3-stage information retrieval (IR) to information extraction (IE) to classification process. The IR component selects relevant note sections and retrieves candidate concept matches from the Systematized Nomenclature of Medicine&#x2013;Clinical Terms. The IE component, implemented implicitly through the language model, identifies and normalizes key medical entities and filters them for contextual relevance (eg, negated, historical, or uncertain findings). The classification stage maps these normalized concepts to the MCPEM topics.</p></sec><sec id="s2-5"><title>Validation Methodology</title><p>We validated this pipeline through a manual review of 500 randomly selected encounters by 4 board-certified emergency physicians (CP, WD, JH, and RK). This process confirmed the high accuracy of our automated approach, with the model&#x2019;s classifications agreeing with the expert consensus 89.76% (377/420) of the time. The interrater reliability among the physician reviewers was substantial (&#x03BA;=0.71). A comprehensive description of the NLP architecture, model configuration, and validation methodology is provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-6"><title>Analysis</title><p>Our analysis focused on 3 key aspects of resident development. To appropriately account for the resident as the primary unit of analysis and the clustered nature of the data (ie, multiple encounters nested within each resident), all encounter-level data were first aggregated to the individual resident level. Statistical comparisons were performed on this resident-level dataset (N=62).</p><p>First, we constructed topic exposure curves by tracking cumulative unique topics over time. Topic exposure rates were calculated using 30-day sliding windows. We defined exposure plateaus as periods where residents encountered fewer than 1 new topic per 100 patients over 3 consecutive measurement windows. Second, we examined variation in exposure by analyzing differences in case volumes, topic coverage, and patient acuity. To quantify the equity of exposure distribution among residents within the same PGY level, we calculated the Gini coefficients. Originally developed to measure income inequality, the Gini coefficient quantifies the inequality of a frequency distribution, with values ranging from 0 (representing perfect equality) to 1 (representing perfect inequality) [<xref ref-type="bibr" rid="ref20">20</xref>]. In this context, a Gini coefficient of 0 would indicate that all residents in a cohort had the exact same volume of exposure to a given measure (eg, high-acuity cases), while a value of 1 would indicate that a single resident received all of the exposure and all others received none. This metric provides a standardized way to compare the degree of interresident variability across different clinical domains and training years. Third, we tracked clinical complexity progression using ESI scores and admission rates as proxies.</p><p>Analyses were performed using R (version 4.3.1; R Foundation for Statistical Computing) and Python (version 3.11). Statistical comparisons between classes were performed using Kruskal-Wallis tests with eta-squared effect sizes. A <italic>P</italic> value of &#x003C;.05 was considered to indicate statistical significance.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Resident Cohort</title><p>Our analysis included the primary-site training experiences of 62 EM residents from 4 graduating classes (2020&#x2010;2023). Over the course of their training, this cohort managed 244,255 patient encounters, representing 133,748 (54.8%) unique patients. Detailed demographic and clinical characteristics of the patient encounters are provided in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Demographic and clinical characteristics of emergency department patient encounters managed by emergency medicine residents at Stanford Hospital, 2016 to 2023 (N=133,748).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristic</td><td align="left" valign="bottom">Values</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="2">Patient demographics</td></tr><tr><td align="left" valign="top">&#x2003;Age (y), mean (SD)</td><td align="left" valign="top">47.2 (25.7)</td></tr><tr><td align="left" valign="top" colspan="2">Sex, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;Female</td><td align="left" valign="top">69,015 (51.6)</td></tr><tr><td align="left" valign="top">&#x2003;Male</td><td align="left" valign="top">64,666 (48.4)</td></tr><tr><td align="left" valign="top">&#x2003;Unknown</td><td align="left" valign="top">67 (0.0)</td></tr><tr><td align="left" valign="top" colspan="2">Race, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;Asian</td><td align="left" valign="top">22,994 (17.2)</td></tr><tr><td align="left" valign="top">&#x2003;Black</td><td align="left" valign="top">6418 (4.8)</td></tr><tr><td align="left" valign="top">&#x2003;Native American</td><td align="left" valign="top">414 (0.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Pacific Islander</td><td align="left" valign="top">2469 (1.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unknown</td><td align="left" valign="top">1564 (1.2)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>White</td><td align="left" valign="top">55,948 (41.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other or multiple</td><td align="left" valign="top">43,939 (32.9)</td></tr><tr><td align="left" valign="top" colspan="2">Ethnicity, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hispanic or Latino</td><td align="left" valign="top">35,132 (26.3)</td></tr><tr><td align="left" valign="top">&#x2003;Non-Hispanic</td><td align="left" valign="top">96,965 (72.5)</td></tr><tr><td align="left" valign="top">&#x2003;Unknown</td><td align="left" valign="top">1649 (1.2)</td></tr><tr><td align="left" valign="top" colspan="2">Insurance, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;Commercial</td><td align="left" valign="top">48,894 (36.6)</td></tr><tr><td align="left" valign="top">&#x2003;Medicare</td><td align="left" valign="top">30,357 (22.7)</td></tr><tr><td align="left" valign="top">&#x2003;Medicaid or Medi-Cal</td><td align="left" valign="top">33,632 (25.2)</td></tr><tr><td align="left" valign="top">&#x2003;Unknown</td><td align="left" valign="top">11,617 (8.7)</td></tr><tr><td align="left" valign="top">&#x2003;Other</td><td align="left" valign="top">9242 (6.9)</td></tr><tr><td align="left" valign="top" colspan="2">Primary language, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;English</td><td align="left" valign="top">110,165 (82.4)</td></tr><tr><td align="left" valign="top">&#x2003;Spanish</td><td align="left" valign="top">16,371 (12.2)</td></tr><tr><td align="left" valign="top">&#x2003;Chinese languages</td><td align="left" valign="top">2257 (1.7)</td></tr><tr><td align="left" valign="top">&#x2003;Southeast Asian languages</td><td align="left" valign="top">1513 (1.1)</td></tr><tr><td align="left" valign="top">&#x2003;Other</td><td align="left" valign="top">3339 (2.5)</td></tr><tr><td align="left" valign="top" colspan="2">Interpreter services, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;Interpreter needed</td><td align="left" valign="top">20,483 (15.3)</td></tr><tr><td align="left" valign="top">&#x2003;No interpreter needed</td><td align="left" valign="top">113,162 (84.6)</td></tr><tr><td align="left" valign="top">&#x2003;Unknown</td><td align="left" valign="top">103 (0.1)</td></tr><tr><td align="left" valign="top" colspan="2">Encounter characteristics</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Total patient encounters, n</td><td align="left" valign="top">244,255</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Encounters per resident, mean (95% CI)</td><td align="left" valign="top">3,940 (3,794-4,086)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Admission rate, %</td><td align="left" valign="top">35.7</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Length of stay (h), median (IQR)</td><td align="left" valign="top">4.8 (3.1&#x2010;7.2)</td></tr><tr><td align="left" valign="top" colspan="2">Emergency Severity Index, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">2759 (1.2)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">57,870 (24.1)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">157,556 (65.7)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">19,766 (8.2)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>5</td><td align="left" valign="top">1894 (0.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Missing</td><td align="left" valign="top">4410 (1.8)</td></tr></tbody></table></table-wrap></sec><sec id="s3-2"><title>Topic Exposure Progression and Interresident Variation</title><p>EM residents demonstrated a clear, progressive acquisition of clinical topic exposure throughout training (<xref ref-type="fig" rid="figure1">Figures 1</xref><xref ref-type="fig" rid="figure2"/><xref ref-type="fig" rid="figure3"/>-<xref ref-type="fig" rid="figure4">4</xref>). The most rapid new topic exposure occurred during postgraduate year 1 (PGY1), with residents encountering a mean of 376.7 (42.1%) unique topics of the 895 MCPEM subcategories. However, PGY1 was also the year with the greatest interresident variability in topic coverage (coefficient of variation [CV]=9.1%). As residents progressed through training, the variation in total topic exposure decreased (PGY4 CV=2.8%).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Cumulative clinical topic exposure curve for the emergency medicine graduating class of 2020 at Stanford Hospital, 2016&#x2010;2020 (n=15). The x-axis represents months of training, and the y-axis represents the mean cumulative number of unique clinical topics from the Model for Clinical Practice of Emergency Medicine encountered by residents. The curve does not reach the total of 895 Model for Clinical Practice of Emergency Medicine topics, indicating that no resident achieved 100% topic exposure during their training at the primary academic site.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v11i1e82326_fig01.png"/></fig><p>Exposure coverage continued to increase in subsequent years, reaching a mean of 447.6 (50%) of MCPEM topics in PGY2, 515.0 (57.5%) in PGY3, and 565.9 (63.2%) in PGY4. Exposure plateaus, defined as periods with minimal new topic exposure, typically occurred in the fourth year of training; for example, the Class of 2023 reached plateaus at a mean of 39.8 (SD 3.0) months (mean 3268 encounters). However, individual variation was substantial: some residents plateaued as early as 38.2 months (2742 encounters), while others continued to encounter new topics through their final month, with final topic coverage ranging from 59.44% (532/895) to 67.26% (602/895) of all possible topics among PGY4 residents.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Cumulative clinical topic exposure curve for the emergency medicine graduating class of 2021 at Stanford Hospital, 2017&#x2010;2021 (n=16). The x-axis represents months of training, and the y-axis represents the mean cumulative number of unique clinical topics from the Model for Clinical Practice of Emergency Medicine encountered by residents. The curve does not reach the total of 895 Model for Clinical Practice of Emergency Medicine topics, indicating that no resident achieved 100% topic exposure during their training at the primary academic site.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v11i1e82326_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Cumulative clinical topic exposure curve for the emergency medicine graduating class of 2022 at Stanford Hospital, 2018&#x2010;2022 (n=15). The x-axis represents months of training, and the y-axis represents the mean cumulative number of unique clinical topics from the Model for Clinical Practice of Emergency Medicine encountered by residents. The curve does not reach the total of 895 Model for Clinical Practice of Emergency Medicine topics, indicating that no resident achieved 100% topic exposure during their training at the primary academic site.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v11i1e82326_fig03.png"/></fig><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Cumulative clinical topic exposure curve for the emergency medicine graduating class of 2023 at Stanford Hospital, 2019&#x2010;2023 (n=16). The x-axis represents months of training, and the y-axis represents the mean cumulative number of unique clinical topics from the Model for Clinical Practice of Emergency Medicine encountered by residents. The curve does not reach the total of 895 Model for Clinical Practice of Emergency Medicine topics, indicating that no resident achieved 100% topic exposure during their training at the primary academic site.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mededu_v11i1e82326_fig04.png"/></fig></sec><sec id="s3-3"><title>Progression of Clinical Workload and Complexity</title><p>In parallel with increasing topic exposure, residents demonstrated a progressive increase in their clinical workload and the complexity of cases managed (<xref ref-type="table" rid="table2">Table 2</xref>). Annual case volumes more than tripled from PGY1 (mean 445.7 encounters) to PGY4 (mean 1528.4 encounters). This growth in volume was accompanied by increasing case acuity, as mean ESI scores progressively decreased from 2.94 in PGY1 to 2.79 in PGY4. Correspondingly, the proportion of high-acuity patients (ESI 1&#x2010;2) managed by residents increased from 16% (4374/27,340) in PGY1 to 30.91% (9418/30,466) in PGY4, and admission rates rose from 31% (8475/27,340) to 37.50% (11425/30,466) over the same period. Notably, the CV for both clinical volume and admission rates followed a U-shaped pattern, decreasing from PGY1 to PGY3 before increasing again in PGY4.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Progression of clinical experience by postgraduate year (PGY) for emergency medicine residents (N=62), Stanford Hospital, 2016 to 2023.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">PGY1</td><td align="left" valign="bottom">PGY2</td><td align="left" valign="bottom">PGY3</td><td align="left" valign="bottom">PGY4</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="5">Annual clinical volume and complexity</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Number of encounters, mean (95% CI)</td><td align="left" valign="top">445.7 (417.6&#x2010;473.7)</td><td align="left" valign="top">772.1 (738.5&#x2010;805.8)</td><td align="left" valign="top">1193.4 (1138.5&#x2010;1248.2)</td><td align="left" valign="top">1528.4 (1429.1&#x2010;1627.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ESI<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> score, mean (95% CI)</td><td align="left" valign="top">2.94 (2.93&#x2010;2.96)</td><td align="left" valign="top">2.87 (2.85&#x2010;2.88)</td><td align="left" valign="top">2.85 (2.84&#x2010;2.87)</td><td align="left" valign="top">2.79 (2.76&#x2010;2.81)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>High-acuity cases (ESI 1&#x2010;2), n/N (%)</td><td align="left" valign="top">4374/27,340 (16)</td><td align="left" valign="top">5575/27,479 (20.2)</td><td align="left" valign="top">7398/30,101 (24.5)</td><td align="left" valign="top">9418/30,466 (30.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Admission rate, % (95% CI)</td><td align="left" valign="top">31.0 (29.7&#x2010;32.4)</td><td align="left" valign="top">38.3 (37.3&#x2010;39.4)</td><td align="left" valign="top">35.5 (34.6&#x2010;36.3)</td><td align="left" valign="top">37.5 (36.3&#x2010;38.8)</td></tr><tr><td align="left" valign="top" colspan="5">Cumulative topic exposure</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cumulative unique MCPEM<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> topics covered, mean (95% CI)</td><td align="left" valign="top">376.7 (367.9&#x2010;385.5)</td><td align="left" valign="top">447.6 (442.2&#x2010;453.0)</td><td align="left" valign="top">515.0 (510.9&#x2010;519.0)</td><td align="left" valign="top">565.9 (561.9&#x2010;569.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cumulative total percentage of MCPEM covered, %</td><td align="left" valign="top">41.1</td><td align="left" valign="top">50</td><td align="left" valign="top">57.5</td><td align="left" valign="top">63.2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>New topics encountered each year, mean (SD)</td><td align="left" valign="top">376.7 (28.4)</td><td align="left" valign="top">71.0 (18.1)</td><td align="left" valign="top">67.3 (14.1)</td><td align="left" valign="top">50.9 (13.3)</td></tr><tr><td align="left" valign="top" colspan="5">Interresident variability (CV<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup>), %</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CV for clinical volume</td><td align="left" valign="top">24.6</td><td align="left" valign="top">17</td><td align="left" valign="top">18</td><td align="left" valign="top">25.4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CV for admission rate</td><td align="left" valign="top">16.4</td><td align="left" valign="top">11.1</td><td align="left" valign="top">9.5</td><td align="left" valign="top">13.4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>CV for topic coverage</td><td align="left" valign="top">9.1</td><td align="left" valign="top">4.7</td><td align="left" valign="top">3.1</td><td align="left" valign="top">2.8</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>ESI: Emergency Severity Index.</p></fn><fn id="table2fn2"><p><sup>b</sup>MCPEM: Model for Clinical Practice of Emergency Medicine.</p></fn><fn id="table2fn3"><p><sup>c</sup>CV: coefficient of variation.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>Distribution of Clinical Experiences</title><p>Residents&#x2019; exposure to the 895 distinct clinical topics followed a consistent pattern&#x2014;they encountered a small core of presentations (n=49, 5.5%) more than 100 times each, a larger set (n=284, 31.7%) between 10 and 100 times, and the majority (n=562, 62.9%) fewer than 10 times. Topic distribution showed moderate inequality (mean Gini coefficient=0.611), with consistency between the graduating classes (<italic>P=</italic>.61). High-acuity case exposure was more unequally distributed (Gini=0.292) than the overall case volumes (Gini=0.117).</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>Our analysis of 62 EM residents across 4 years of training revealed distinct and progressive patterns in the arc of their clinical experience. Using a novel NLP methodology on over 244,000 clinical encounters, we found that residents demonstrated a rapid acquisition of topic exposure in their first year, which continued, albeit at a slower rate, deep into their fourth year. Importantly, this continued exposure occurs in the context of increasing clinical complexity and, based on our program&#x2019;s structure, escalating supervisory responsibility. These findings provide empirical evidence that can inform the national debate on the optimal length of EM training and highlight the potential for data-driven, precision education.</p></sec><sec id="s4-2"><title>Implications for Competency-Based Medical Education</title><p>The observed pattern of topic exposure, rapid initial acquisition followed by a plateau, aligns with the power-law &#x201C;experience curves&#x201D; documented in medical education by Pusic et al [<xref ref-type="bibr" rid="ref21">21</xref>] However, it is critical to note that case exposures are merely the substrate for learning and are not all equal in value toward developing competence. The conversion of these experiences into durable competence is a complex process mediated by the <italic>deliberate</italic> components of the theory of deliberate practice by Ericsson [<xref ref-type="bibr" rid="ref22">22</xref>], such as feedback, reflection, and coaching [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. Indeed, recent research has shown that even established competency measures, such as milestones, may not directly correlate with early-career patient outcomes, cautioning against a simple equation of more exposure with more competence [<xref ref-type="bibr" rid="ref25">25</xref>]. Therefore, the primary value of the exposure data we present lies in its ability to serve as a powerful objective input for these established educational frameworks. At our institution, for example, these components are formalized through a resident coaching program and a quarterly Clinical Competency Committee, systems for which this objective exposure data can provide a more precise foundation for assessment and goal-setting, and tracking progress toward the Accreditation Council for Graduate Medical Education milestones [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref26">26</xref>].</p></sec><sec id="s4-3"><title>Informing the Debate on Training Duration</title><p>A central question for the EM as a specialty is whether a 3- or 4-year training model is optimal. Our data provide empirical evidence relevant to this debate. The finding that residents continue to acquire a mean of 50.9 new core topics in their PGY4 year, representing a 9.9% (51/515) increase over PGY3, suggests that the fourth year offers more than just redundant experience. This quantitative increase is accompanied by a significant qualitative shift&#x2014;PGY4 residents manage a higher proportion of high-acuity patients (ESI 1&#x2010;2) and cases requiring hospitalization. This exposure to a more complex and challenging case mix, as supported by work from Lam et al [<xref ref-type="bibr" rid="ref10">10</xref>] and Zhou et al [<xref ref-type="bibr" rid="ref27">27</xref>], is critical for developing the advanced diagnostic reasoning necessary for independent practice.</p></sec><sec id="s4-4"><title>Understanding Interresident Variation</title><p>Our analysis also revealed significant interresident variation, particularly in the timing of exposure plateaus and in the experience with high-acuity cases. This aligns with findings from other specialties and supports a more personalized view of competency development [<xref ref-type="bibr" rid="ref28">28</xref>]. This variability is likely to be driven by a combination of systemic factors and resident choices. We propose framing this variability within the concept of &#x201C;warranted versus unwarranted variation&#x201D; as described by Holmboe and Kogan [<xref ref-type="bibr" rid="ref29">29</xref>]. While some variation is an expected and even desirable feature of individualized learning, our NLP-based tool provides a mechanism for programs to identify potentially unwarranted gaps in exposure to core experiences. Notably, the decreasing CV in total topic coverage from PGY1 (9.1%) to PGY4 (2.8%) suggests that a longer training duration may lead to a more standardized and equitable clinical experience among graduates.</p><p>The U-shaped pattern observed in the variability of clinical volume and admission rates is an intriguing finding. We hypothesize that this reflects the evolving roles within our program&#x2014;PGY1 residents have variable schedules due to numerous off-service rotations; PGY2 and PGY3 residents assume more structured supervisory roles within a pod system, which may standardize their workflow and decrease variability; finally, in PGY4, residents are granted greater autonomy to run a pod independently while also supervising junior residents, potentially allowing individual practice styles to reemerge at increasing variability.</p></sec><sec id="s4-5"><title>Bridging the Curriculum-Practice Gap and Methodological Advantages</title><p>A key finding of this study is that even after 4 years, residents were not exposed to over a third of the topics listed in the MCPEM (329/895, 36.76%). This highlights the fundamental tension between the prescribed curriculum and the reality of clinical practice. Achieving 100% topic coverage is likely an unachievable goal for any single residency program. The true aim of training is not encyclopedic exposure but rather developing the core competencies and adaptive expertise required for safe, independent practice and effective lifelong learning. Our NLP-based methodology offers a powerful, dual-pronged approach to address this gap. At the local program level, it serves as a diagnostic tool, enabling educators to identify and amend exposure gaps through targeted interventions, such as simulation. More broadly, the scalability of this approach presents an opportunity to transform the specialty&#x2019;s understanding of its own work. If applied across multiple institutions, this method could create a dynamic, data-driven map of the actual clinical practice of EM, providing an evidence base for future revisions of the MCPEM. This would allow the model to better reflect the true prevalence and complexity of conditions encountered in contemporary practice, ensuring a more authentic alignment between what is taught, what is tested, and what is practiced. Nonetheless, there will likely always remain a set of high-acuity, low-frequency conditions for which training programs must prescribe exposure through didactics, as real-world encounters will be too rare to ensure universal competence.</p><p>A key advantage of this methodology is its practical implementation. Traditional NLP pipelines often require a substantial upfront investment in manual data annotation for model training and specialized expertise. In contrast, our retrieval-augmented generation approach takes advantage of a pretrained large language model that requires no model-specific training, dramatically reducing the implementation complexity. To offer a concrete sense of financial feasibility, the total cost for the application programming interface calls to process all 244,255 clinical encounters for this study was approximately US $180, demonstrating the financial accessibility of this approach for programs seeking to adopt data-driven educational strategies. Framing our pipeline in IR and IE terms also clarifies where most misclassifications arise&#x2014;either from retrieval scope or from information-extraction phenomena such as negation or temporality&#x2014;providing a useful structure for future error analysis and comparison to traditional rule-based clinical NLP systems.</p></sec><sec id="s4-6"><title>Limitations</title><p>This study has several limitations. As a single-institution study, our findings may not be generalizable to programs with a 3-year training format, or to institutions operating in different clinical settings. A primary limitation is that our analysis excludes data from additional training sites, which constitute a significant proportion of resident training (approximately 30%&#x2010;35% of ED time, depending on the PGY level), and from off-service rotation where key procedural and critical care exposures occur (eg, anesthesia, intensive care unit, etc). The training period for our cohorts also overlapped with the COVID-19 pandemic, which may have influenced case volumes and mix, although the remarkable consistency of exposure patterns we observed across the 4 classes mitigates this concern. Finally, although our NLP approach achieved high accuracy in classifying clinical encounters (89.7% agreement with physician review), this methodology relies on the comprehensiveness of resident documentation, which may vary between individuals and over time.</p><p>In conclusion, our analysis reveals both consistent patterns in resident clinical exposure and substantial individual variation in topic exposure trajectories. The finding that many residents continue to encounter new clinical topics into their fourth year provides empirical evidence for the potential educational value of a 4-year training model. NLP of clinical documentation offers EM programs a powerful and accessible tool to objectively measure and optimize resident clinical experiences based on actual exposure patterns, moving beyond traditional metrics to foster a more precise, data-informed, and equitable approach to graduate medical education.</p></sec></sec></body><back><notes><sec><title>Funding</title><p>No external financial support or grants were received from any public, commercial, or not-for-profit entities for the research, authorship, or publication of this article.</p></sec><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available from the corresponding author upon reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization (lead): CP, CR</p><p>Methodology (lead): CP, JH; (supporting): RK, CR</p><p>Software (lead): CP</p><p>Data curation (lead): CP</p><p>Formal analysis (lead): CP</p><p>Writing&#x2013;original draft (lead): CP, JH, CR; (supporting): RK, WD</p><p>Writing&#x2013;review &#x0026; editing (equal): CP, JH, RK, WD, CR</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CV</term><def><p>coefficient of variation</p></def></def-item><def-item><term id="abb2">ED</term><def><p>emergency department</p></def></def-item><def-item><term id="abb3">EM</term><def><p>emergency medicine</p></def></def-item><def-item><term id="abb4">ESI</term><def><p>Emergency Severity Index</p></def></def-item><def-item><term id="abb5">IE</term><def><p>information extraction</p></def></def-item><def-item><term id="abb6">IR</term><def><p>information retrieval</p></def></def-item><def-item><term id="abb7">MCPEM</term><def><p>Model for Clinical Practice of Emergency Medicine</p></def></def-item><def-item><term id="abb8">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb9">PGY</term><def><p>postgraduate year</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="web"><article-title>ACGME program requirements for graduate medical education in emergency medicine</article-title><source>Accreditation Council for Graduate Medical Education</source><year>2025</year><access-date>2025-03-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.acgme.org/globalassets/pfassets/reviewandcomment/2025/110_emergencymedicine_rc_02122025.pdf">https://www.acgme.org/globalassets/pfassets/reviewandcomment/2025/110_emergencymedicine_rc_02122025.pdf</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sebok-Syer</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Shepherd</surname><given-names>L</given-names> </name><name name-style="western"><surname>McConnell</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dukelow</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Sedran</surname><given-names>R</given-names> </name><name name-style="western"><surname>Lingard</surname><given-names>L</given-names> </name></person-group><article-title>&#x201C;EMERGing&#x201D; electronic health record data metrics: insights and implications for assessing residents&#x2019; clinical performance in emergency medicine</article-title><source>AEM Educ Train</source><year>2020</year><month>08</month><day>9</day><volume>5</volume><issue>2</issue><fpage>e10501</fpage><pub-id pub-id-type="doi">10.1002/aet2.10501</pub-id><pub-id pub-id-type="medline">33898906</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sirovich</surname><given-names>BE</given-names> </name><name name-style="western"><surname>Lipner</surname><given-names>RS</given-names> </name><name name-style="western"><surname>Johnston</surname><given-names>M</given-names> </name><name name-style="western"><surname>Holmboe</surname><given-names>ES</given-names> </name></person-group><article-title>The association between residency training and internists&#x2019; ability to practice conservatively</article-title><source>JAMA Intern Med</source><year>2014</year><month>10</month><volume>174</volume><issue>10</issue><fpage>1640</fpage><lpage>1648</lpage><pub-id pub-id-type="doi">10.1001/jamainternmed.2014.3337</pub-id><pub-id pub-id-type="medline">25179515</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>C</given-names> </name><name name-style="western"><surname>Petterson</surname><given-names>S</given-names> </name><name name-style="western"><surname>Phillips</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bazemore</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mullan</surname><given-names>F</given-names> </name></person-group><article-title>Spending patterns in region of residency training and subsequent expenditures for care provided by practicing physicians for Medicare beneficiaries</article-title><source>JAMA</source><year>2014</year><month>12</month><day>10</day><volume>312</volume><issue>22</issue><fpage>2385</fpage><lpage>2393</lpage><pub-id pub-id-type="doi">10.1001/jama.2014.15973</pub-id><pub-id pub-id-type="medline">25490329</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Burk-Rafel</surname><given-names>J</given-names> </name><name name-style="western"><surname>Drake</surname><given-names>CB</given-names> </name><name name-style="western"><surname>Sartori</surname><given-names>DJ</given-names> </name></person-group><article-title>Characterizing residents&#x2019; clinical experiences-a step toward precision education</article-title><source>JAMA Netw Open</source><year>2024</year><month>12</month><day>2</day><volume>7</volume><issue>12</issue><fpage>e2450774</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2024.50774</pub-id><pub-id pub-id-type="medline">39693075</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Langdorf</surname><given-names>MI</given-names> </name><name name-style="western"><surname>Strange</surname><given-names>G</given-names> </name><name name-style="western"><surname>Macneil</surname><given-names>P</given-names> </name></person-group><article-title>Computerized tracking of emergency medicine resident clinical experience</article-title><source>Ann Emerg Med</source><year>1990</year><month>07</month><volume>19</volume><issue>7</issue><fpage>764</fpage><lpage>773</lpage><pub-id pub-id-type="doi">10.1016/s0196-0644(05)81700-7</pub-id><pub-id pub-id-type="medline">2389860</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nagler</surname><given-names>J</given-names> </name><name name-style="western"><surname>Harper</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Bachur</surname><given-names>RG</given-names> </name></person-group><article-title>An automated electronic case log: using electronic information systems to assess training in emergency medicine</article-title><source>Acad Emerg Med</source><year>2006</year><month>07</month><volume>13</volume><issue>7</issue><fpage>733</fpage><lpage>739</lpage><pub-id pub-id-type="doi">10.1197/j.aem.2006.02.010</pub-id><pub-id pub-id-type="medline">16723724</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rhee</surname><given-names>DW</given-names> </name><name name-style="western"><surname>Reinstein</surname><given-names>I</given-names> </name><name name-style="western"><surname>Jrada</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Mapping hospital data to characterize residents&#x2019; educational experiences</article-title><source>BMC Med Educ</source><year>2022</year><month>06</month><day>25</day><volume>22</volume><issue>1</issue><fpage>496</fpage><pub-id pub-id-type="doi">10.1186/s12909-022-03561-x</pub-id><pub-id pub-id-type="medline">35752814</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rhee</surname><given-names>DW</given-names> </name><name name-style="western"><surname>Chun</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Stern</surname><given-names>DT</given-names> </name><name name-style="western"><surname>Sartori</surname><given-names>DJ</given-names> </name></person-group><article-title>Experience and education in residency training: capturing the resident experience by mapping clinical data</article-title><source>Acad Med</source><year>2022</year><month>02</month><day>1</day><volume>97</volume><issue>2</issue><fpage>228</fpage><lpage>232</lpage><pub-id pub-id-type="doi">10.1097/ACM.0000000000004162</pub-id><pub-id pub-id-type="medline">33983144</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lam</surname><given-names>AC</given-names> </name><name name-style="western"><surname>Tang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Variation in case exposure during internal medicine residency</article-title><source>JAMA Netw Open</source><year>2024</year><month>12</month><day>2</day><volume>7</volume><issue>12</issue><fpage>e2450768</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2024.50768</pub-id><pub-id pub-id-type="medline">39693070</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lam</surname><given-names>AC</given-names> </name><name name-style="western"><surname>Tang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Lalwani</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Methodology paper for the General Medicine Inpatient Initiative Medical Education Database (GEMINI MedED): a retrospective cohort study of internal medicine resident case-mix, clinical care and patient outcomes</article-title><source>BMJ Open</source><year>2022</year><month>09</month><day>23</day><volume>12</volume><issue>9</issue><fpage>e062264</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2022-062264</pub-id><pub-id pub-id-type="medline">36153026</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bischof</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Emerson</surname><given-names>G</given-names> </name><name name-style="western"><surname>Mitzman</surname><given-names>J</given-names> </name><name name-style="western"><surname>Khandelwal</surname><given-names>S</given-names> </name><name name-style="western"><surname>Way</surname><given-names>DP</given-names> </name><name name-style="western"><surname>Southerland</surname><given-names>LT</given-names> </name></person-group><article-title>Does the emergency medicine in-training examination accurately reflect residents&#x2019; clinical experiences?</article-title><source>AEM Educ Train</source><year>2019</year><month>09</month><day>19</day><volume>3</volume><issue>4</issue><fpage>317</fpage><lpage>322</lpage><pub-id pub-id-type="doi">10.1002/aet2.10381</pub-id><pub-id pub-id-type="medline">31637348</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Triola</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Burk-Rafel</surname><given-names>J</given-names> </name></person-group><article-title>Precision medical education</article-title><source>Acad Med</source><year>2023</year><month>07</month><day>1</day><volume>98</volume><issue>7</issue><fpage>775</fpage><lpage>781</lpage><pub-id pub-id-type="doi">10.1097/ACM.0000000000005227</pub-id><pub-id pub-id-type="medline">37027222</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Weber</surname><given-names>SC</given-names> </name><name name-style="western"><surname>Pallas</surname><given-names>J</given-names> </name><name name-style="western"><surname>Olson</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Compliant self service access to secondary use clinical data at stanford medicine</article-title><source>arXiv</source><comment>Preprint posted online on  Dec 5, 2024</comment><pub-id pub-id-type="doi">10.48550/arxiv.2412.04248</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Beeson</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Bhat</surname><given-names>R</given-names> </name><name name-style="western"><surname>Broder</surname><given-names>JS</given-names> </name><etal/></person-group><article-title>The 2022 model of the clinical practice of emergency medicine</article-title><source>J Emerg Med</source><year>2023</year><month>06</month><volume>64</volume><issue>6</issue><fpage>659</fpage><lpage>695</lpage><pub-id pub-id-type="doi">10.1016/j.jemermed.2023.02.016</pub-id><pub-id pub-id-type="medline">37244783</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="web"><article-title>Gemini models</article-title><source>Google AI for Developers</source><access-date>2025-03-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://ai.google.dev/gemini-api/docs/models">https://ai.google.dev/gemini-api/docs/models</ext-link></comment></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Klang</surname><given-names>E</given-names> </name><name name-style="western"><surname>Tessler</surname><given-names>I</given-names> </name><name name-style="western"><surname>Apakama</surname><given-names>DU</given-names> </name><etal/></person-group><article-title>Assessing retrieval-augmented large language model performance in emergency department ICD-10-CM coding compared to human coders</article-title><source>medRxiv</source><comment>Preprint posted online on  Oct 17, 2024</comment><pub-id pub-id-type="doi">10.1101/2024.10.15.24315526</pub-id><pub-id pub-id-type="medline">39484238</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>D&#x2019;Oosterlinck</surname><given-names>K</given-names> </name><name name-style="western"><surname>Khattab</surname><given-names>O</given-names> </name><name name-style="western"><surname>Remy</surname><given-names>F</given-names> </name><name name-style="western"><surname>Demeester</surname><given-names>T</given-names> </name><name name-style="western"><surname>Develder</surname><given-names>C</given-names> </name><name name-style="western"><surname>Potts</surname><given-names>C</given-names> </name></person-group><article-title>In-context learning for extreme multi-label classification</article-title><source>arXiv</source><comment>Preprint posted online on  Jan 22, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2401.12178</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="web"><article-title>The CORE problem list subset of SNOMED CT&#x00AE;</article-title><source>US National Library of Medicine</source><access-date>2025-03-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.nlm.nih.gov/research/umls/Snomed/core_subset.html">https://www.nlm.nih.gov/research/umls/Snomed/core_subset.html</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Thomas</surname><given-names>V</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Fan</surname><given-names>X</given-names> </name></person-group><article-title>Measuring education inequality: Gini coefficients of education</article-title><source>Social Science Research Network</source><year>2001</year><access-date>2025-06-12</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://papers.ssrn.com/abstract=258182">https://papers.ssrn.com/abstract=258182</ext-link></comment></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pusic</surname><given-names>MV</given-names> </name><name name-style="western"><surname>Kessler</surname><given-names>D</given-names> </name><name name-style="western"><surname>Szyld</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kalet</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pecaric</surname><given-names>M</given-names> </name><name name-style="western"><surname>Boutis</surname><given-names>K</given-names> </name></person-group><article-title>Experience curves as an organizing framework for deliberate practice in emergency medicine learning</article-title><source>Acad Emerg Med</source><year>2012</year><month>12</month><volume>19</volume><issue>12</issue><fpage>1476</fpage><lpage>1480</lpage><pub-id pub-id-type="doi">10.1111/acem.12043</pub-id><pub-id pub-id-type="medline">23230958</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ericsson</surname><given-names>KA</given-names> </name></person-group><article-title>Deliberate practice and the acquisition and maintenance of expert performance in medicine and related domains</article-title><source>Acad Med</source><year>2004</year><month>10</month><volume>79</volume><issue>10 Suppl</issue><fpage>S70</fpage><lpage>S81</lpage><pub-id pub-id-type="doi">10.1097/00001888-200410001-00022</pub-id><pub-id pub-id-type="medline">15383395</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Natesan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Jordan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sheng</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Feedback in medical education: an evidence-based guide to best practices from the Council of Residency Directors in Emergency Medicine</article-title><source>West J Emerg Med</source><year>2023</year><month>05</month><day>5</day><volume>24</volume><issue>3</issue><fpage>479</fpage><lpage>494</lpage><pub-id pub-id-type="doi">10.5811/westjem.56544</pub-id><pub-id pub-id-type="medline">37278777</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fredette</surname><given-names>J</given-names> </name><name name-style="western"><surname>Michalec</surname><given-names>B</given-names> </name><name name-style="western"><surname>Billet</surname><given-names>A</given-names> </name><etal/></person-group><article-title>A qualitative assessment of emergency medicine residents&#x2019; receptivity to feedback</article-title><source>AEM Educ Train</source><year>2021</year><month>08</month><day>1</day><volume>5</volume><issue>4</issue><fpage>e10658</fpage><pub-id pub-id-type="doi">10.1002/aet2.10658</pub-id><pub-id pub-id-type="medline">34527849</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kendrick</surname><given-names>DE</given-names> </name><name name-style="western"><surname>Thelen</surname><given-names>AE</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Association of surgical resident competency ratings with patient outcomes</article-title><source>Acad Med</source><year>2023</year><month>07</month><day>1</day><volume>98</volume><issue>7</issue><fpage>813</fpage><lpage>820</lpage><pub-id pub-id-type="doi">10.1097/ACM.0000000000005157</pub-id><pub-id pub-id-type="medline">36724304</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sebok-Syer</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Shaw</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Sedran</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Facilitating residents&#x2019; understanding of electronic health record report card data using faculty feedback and coaching</article-title><source>Acad Med</source><year>2022</year><month>11</month><day>1</day><volume>97</volume><issue>11S</issue><fpage>S22</fpage><lpage>S28</lpage><pub-id pub-id-type="doi">10.1097/ACM.0000000000004900</pub-id><pub-id pub-id-type="medline">35947480</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>L</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>R</given-names> </name><name name-style="western"><surname>Qi</surname><given-names>Y</given-names> </name></person-group><article-title>Effectiveness of scaffolded case-based learning in anesthesiology residency training: a randomized controlled trial</article-title><source>BMC Med Educ</source><year>2025</year><month>05</month><day>8</day><volume>25</volume><issue>1</issue><fpage>672</fpage><pub-id pub-id-type="doi">10.1186/s12909-025-07236-1</pub-id><pub-id pub-id-type="medline">40340724</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Frank</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Snell</surname><given-names>LS</given-names> </name><name name-style="western"><surname>Cate</surname><given-names>OT</given-names> </name><etal/></person-group><article-title>Competency-based medical education: theory to practice</article-title><source>Med Teach</source><year>2010</year><volume>32</volume><issue>8</issue><fpage>638</fpage><lpage>645</lpage><pub-id pub-id-type="doi">10.3109/0142159X.2010.501190</pub-id><pub-id pub-id-type="medline">20662574</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Holmboe</surname><given-names>ES</given-names> </name><name name-style="western"><surname>Kogan</surname><given-names>JR</given-names> </name></person-group><article-title>Will any road get you there? Examining warranted and unwarranted variation in medical education</article-title><source>Acad Med</source><year>2022</year><month>08</month><day>1</day><volume>97</volume><issue>8</issue><fpage>1128</fpage><lpage>1136</lpage><pub-id pub-id-type="doi">10.1097/ACM.0000000000004667</pub-id><pub-id pub-id-type="medline">35294414</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Technical description of the natural language processing pipeline, validation procedures, and statistical analysis methods.</p><media xlink:href="mededu_v11i1e82326_app1.docx" xlink:title="DOCX File, 36 KB"/></supplementary-material></app-group></back></article>