<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="letter" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JME</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Educ</journal-id>
      <journal-title>JMIR Medical Education</journal-title>
      <issn pub-type="epub">2369-3762</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i1e48780</article-id>
      <article-id pub-id-type="pmid">37728965</article-id>
      <article-id pub-id-type="doi">10.2196/48780</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Research Letter</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Research Letter</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Anki Tagger: A Generative AI Tool for Aligning Third-Party Resources to Preclinical Curriculum</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>de Azevedo Cardoso</surname>
            <given-names>Taiane</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Senst</surname>
            <given-names>Benjamin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Arya</surname>
            <given-names>Savita</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Pendergrast</surname>
            <given-names>Tricia</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2396-9100</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Chalmers</surname>
            <given-names>Zachary</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Northwestern University Feinberg School of Medicine</institution>
            <addr-line>303 E Chicago Ave</addr-line>
            <addr-line>Morton 1-670</addr-line>
            <addr-line>Chicago, IL, 60611</addr-line>
            <country>United States</country>
            <phone>1 3125038194</phone>
            <email>zachary.chalmers@northwestern.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1012-8529</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Anesthesiology</institution>
        <institution>University of Michigan Medicine</institution>
        <addr-line>Ann Arbor, MI</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Northwestern University Feinberg School of Medicine</institution>
        <addr-line>Chicago, IL</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Zachary Chalmers <email>zachary.chalmers@northwestern.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>20</day>
        <month>9</month>
        <year>2023</year>
      </pub-date>
      <volume>9</volume>
      <elocation-id>e48780</elocation-id>
      <history>
        <date date-type="received">
          <day>6</day>
          <month>7</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>26</day>
          <month>7</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>1</day>
          <month>8</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>17</day>
          <month>8</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Tricia Pendergrast, Zachary Chalmers. Originally published in JMIR Medical Education (https://mededu.jmir.org), 20.09.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Education, is properly cited. The complete bibliographic information, a link to the original publication on https://mededu.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://mededu.jmir.org/2023/1/e48780" xlink:type="simple"/>
      <abstract>
        <p>Using large language models, we developed a method to efficiently query existing flashcard libraries and select those most relevant to an individual's medical school curricula.</p>
      </abstract>
      <kwd-group>
        <kwd>ChatGPT</kwd>
        <kwd>undergraduate medical education</kwd>
        <kwd>large language models</kwd>
        <kwd>Anki</kwd>
        <kwd>flashcards</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>AI</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>ChatGPT is a natural language processing tool that uses deep learning to generate responses to questions from human users [<xref ref-type="bibr" rid="ref1">1</xref>]. ChatGPT has many possible applications in health care and medical education [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      <p>Medical students complete much of their preclinical didactic learning outside of the classroom, with the assistance of third-party resources such as Anki flashcard decks, instead of traditional lectures [<xref ref-type="bibr" rid="ref3">3</xref>]. Anki flashcard decks use the principle of spaced repetition to improve memorization [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Medical students found Anki flashcards produced for their specific curriculum helpful and believed that these flashcards reduced anxiety. However, most medical students use open-sourced flashcards available online [<xref ref-type="bibr" rid="ref6">6</xref>]. These decks are maintained by medical students who collaborate using the social media platform Reddit (/r/medicalschoolanki) [<xref ref-type="bibr" rid="ref7">7</xref>] and through a subscription-based web application that facilitates crowdsourced peer review of flashcard content [<xref ref-type="bibr" rid="ref8">8</xref>]. Medical students work together to address errors in the flashcards and update them as needed.</p>
      <p>Use of crowdsourced flashcard decks eliminates the investment of time required upfront to produce flashcards for each lecture, but these flashcards are not specific to the user’s medical school curriculum [<xref ref-type="bibr" rid="ref4">4</xref>]. A mechanism to match existing flashcards, created and vetted by medical students within the Reddit and AnkiHub communities, to the learning goals of didactic lectures delivered by medical school faculty members would be less time-intensive for faculty and students. In this research letter, we describe a novel method to efficiently select relevant flashcards from existing Anki decks and associate those cards with individual lectures within the user’s medical school curriculum.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <p>There are 4 core steps in the workflow (<xref rid="figure1" ref-type="fig">Figure 1</xref>)<italic>.</italic> The cards of a target Anki deck are embedded in a large language model (LLM). The gpt-3.5-turbo-16k model summarizes the learning guide into a set of comprehensive learning questions. Cards are presorted for their relevance to the learning question, using the LLM deck embedding, and then gpt-3.5-turbo scores the relevance of these cards to the learning question<italic>,</italic> which continues until a user-defined query limit for the learning question has been reached. Finally, cards are tagged in the original Anki file, stratified into “highly relevant,” “somewhat relevant,” or “minimally relevant” categories. Technical documentation and scripts are deposited in GitHub [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Workflow schematic.</p>
        </caption>
        <graphic xlink:href="mededu_v9i1e48780_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>Using the method described above, we selected flashcards from the AnKing flashcard deck that contained 35,152 flashcards and tagged them to our institution’s preclinical curriculum (<xref rid="figure2" ref-type="fig">Figure 2</xref>) [<xref ref-type="bibr" rid="ref8">8</xref>]. We obtained a total of 465 science of medicine lecture guides spanning the 15 system-based modules at Feinberg School of Medicine for the 2022-2023 academic year. For each lecture guide, an average of 13 (range 5-34) summary learning questions were generated by our algorithm. For example, a lecture on central nervous system cancers, might include the following questions: “How do we diagnose and treat gliomas?” and “What genetic syndromes are associated with benign and malignant tumors in the brain?” After generating 4918 unique learning questions, the selection algorithm yielded a total of 21,400 flashcards from the AnKing deck, of which 16,113 were designated as highly relevant to a learning question. On average, 88 (range 11-221) flashcards were selected per lecture. Upon inspection of a sample of lectures, the quality of selections was considered high, with &#62;90% of cards appearing highly relevant. The process developed is highly scalable, with individual lecture guides processed in minutes at minimal computational cost.</p>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Hierarchical tag structure.</p>
        </caption>
        <graphic xlink:href="mededu_v9i1e48780_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>It is up to medical schools to decide how to adapt to a status quo increasingly defined by student-driven medical education. One possibility is for medical schools to align the student-driven curriculum with the instructor-led curriculum and consider the incorporation of vetted, third-party resources, such as Anki, into didactic learning [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
      <p>Using large language models, we developed a method to efficiently query flashcards in existing widely used libraries and select those most relevant to an individual's medical school curricula. The feasibility of implementing a ChatGPT flashcard generation into pre-clerkship medical school curricula has not been evaluated and is an area of future study, with algorithmic fine-tuning and prompt optimization likely to further increase the specificity of selections Subsequently, a comparison of medical students’ satisfaction with self-made Anki flashcards compared to ChatGPT-tagged Anki flashcard decks should be conducted.</p>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gilson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Safranek</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Socrates</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Chartash</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>How does ChatGPT perform on the United States Medical Licensing Examination? the implications of large language models for medical education and knowledge assessment</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <month>02</month>
          <day>08</day>
          <volume>9</volume>
          <fpage>e45312</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023//e45312/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/45312</pub-id>
          <pub-id pub-id-type="medline">36753318</pub-id>
          <pub-id pub-id-type="pii">v9i1e45312</pub-id>
          <pub-id pub-id-type="pmcid">PMC9947764</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayoub</surname>
              <given-names>NF</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Grimm</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Balakrishnan</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Comparison between ChatGPT and Google Search as sources of postoperative patient instructions</article-title>
          <source>JAMA Otolaryngol Head Neck Surg</source>
          <year>2023</year>
          <month>06</month>
          <day>01</day>
          <volume>149</volume>
          <issue>6</issue>
          <fpage>556</fpage>
          <lpage>558</lpage>
          <pub-id pub-id-type="doi">10.1001/jamaoto.2023.0704</pub-id>
          <pub-id pub-id-type="medline">37103921</pub-id>
          <pub-id pub-id-type="pii">2804300</pub-id>
          <pub-id pub-id-type="pmcid">PMC10141286</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Gruppuso</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Adashi</surname>
              <given-names>EY</given-names>
            </name>
          </person-group>
          <article-title>The self-directed medical student curriculum</article-title>
          <source>JAMA</source>
          <year>2021</year>
          <month>11</month>
          <day>23</day>
          <volume>326</volume>
          <issue>20</issue>
          <fpage>2005</fpage>
          <lpage>2006</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2021.16312</pub-id>
          <pub-id pub-id-type="medline">34724030</pub-id>
          <pub-id pub-id-type="pii">2785917</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wothe</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Wanberg</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hohle</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Sakher</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Bosacker</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Olson</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Satin</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>Academic and wellness outcomes associated with use of Anki spaced repetition software in medical school</article-title>
          <source>J Med Educ Curric Dev</source>
          <year>2023</year>
          <month>05</month>
          <day>08</day>
          <volume>10</volume>
          <fpage>23821205231173289</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/23821205231173289?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/23821205231173289</pub-id>
          <pub-id pub-id-type="medline">37187920</pub-id>
          <pub-id pub-id-type="pii">10.1177_23821205231173289</pub-id>
          <pub-id pub-id-type="pmcid">PMC10176558</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jape</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bullock</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A spaced-repetition approach to enhance medical student learning and engagement in medical pharmacology</article-title>
          <source>BMC Med Educ</source>
          <year>2022</year>
          <month>05</month>
          <day>02</day>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>337</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmededuc.biomedcentral.com/articles/10.1186/s12909-022-03324-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12909-022-03324-8</pub-id>
          <pub-id pub-id-type="medline">35501765</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12909-022-03324-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC9063128</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rana</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Laoteppitaks</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Troutman</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chandra</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>An investigation of Anki Flashcards as a study tool among first year medical students learning anatomy</article-title>
          <source>The FASEB Journal</source>
          <year>2020</year>
          <month>04</month>
          <day>20</day>
          <volume>34</volume>
          <issue>S1</issue>
          <fpage>1</fpage>
          <lpage>1</lpage>
          <pub-id pub-id-type="doi">10.1096/fasebj.2020.34.s1.09736</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <article-title>Medical School Anki</article-title>
          <source>Reddit</source>
          <access-date>2023-06-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.reddit.com/r/medicalschoolanki/">https://www.reddit.com/r/medicalschoolanki/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <source>AnkiHub</source>
          <access-date>2023-06-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ankihub.net/">https://www.ankihub.net/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <article-title>zachalmers - Anki_Tagger</article-title>
          <source>GitHub</source>
          <access-date>2023-09-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/zachalmers/Anki_Tagger">https://github.com/zachalmers/Anki_Tagger</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
