<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JME</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Educ</journal-id>
      <journal-title>JMIR Medical Education</journal-title>
      <issn pub-type="epub">2369-3762</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i2e30988</article-id>
      <article-id pub-id-type="pmid">35486423</article-id>
      <article-id pub-id-type="doi">10.2196/30988</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Video-Based Communication Assessment of Physician Error Disclosure Skills by Crowdsourced Laypeople and Patient Advocates Who Experienced Medical Harm: Reliability Assessment With Generalizability Theory</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Leung</surname>
            <given-names>Tiffany</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Suppan</surname>
            <given-names>Laurent</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wolfe</surname>
            <given-names>Hill</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>White</surname>
            <given-names>Andrew A</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Medicine</institution>
            <institution>University of Washington School of Medicine</institution>
            <addr-line>Box 356429</addr-line>
            <addr-line>1959 Pacific St</addr-line>
            <addr-line>Seattle, WA, 98195</addr-line>
            <country>United States</country>
            <phone>1 206 616 1447</phone>
            <fax>1 206 221 8732</fax>
            <email>andwhite@uw.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9859-0947</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>King</surname>
            <given-names>Ann M</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6994-9711</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>D’Addario</surname>
            <given-names>Angelo E</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7687-3049</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Brigham</surname>
            <given-names>Karen Berg</given-names>
          </name>
          <degrees>JD, MPH</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3852-7591</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Dintzis</surname>
            <given-names>Suzanne</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9762-030X</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Fay</surname>
            <given-names>Emily E</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5582-2835</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Gallagher</surname>
            <given-names>Thomas H</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8323-1450</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Mazor</surname>
            <given-names>Kathleen M</given-names>
          </name>
          <degrees>EdD</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9491-9872</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Medicine</institution>
        <institution>University of Washington School of Medicine</institution>
        <addr-line>Seattle, WA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>National Board of Medical Examiners</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Collaborative for Accountability and Improvement</institution>
        <institution>University of Washington</institution>
        <addr-line>Seattle, WA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Pathology</institution>
        <institution>University of Washington School of Medicine</institution>
        <addr-line>Seattle, WA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Obstetrics and Gynecology</institution>
        <institution>University of Washington School of Medicine</institution>
        <addr-line>Seattle, WA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department of Bioethics and Humanities</institution>
        <institution>University of Washington</institution>
        <addr-line>Seattle, WA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Meyers Primary Care Institute</institution>
        <institution>University of Massachusetts Medical School</institution>
        <addr-line>Worcester, MA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Andrew A White <email>andwhite@uw.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Apr-Jun</season>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>29</day>
        <month>4</month>
        <year>2022</year>
      </pub-date>
      <volume>8</volume>
      <issue>2</issue>
      <elocation-id>e30988</elocation-id>
      <history>
        <date date-type="received">
          <day>27</day>
          <month>6</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>4</day>
          <month>2</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>19</day>
          <month>2</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>31</day>
          <month>3</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Andrew A White, Ann M King, Angelo E D’Addario, Karen Berg Brigham, Suzanne Dintzis, Emily E Fay, Thomas H Gallagher, Kathleen M Mazor. Originally published in JMIR Medical Education (https://mededu.jmir.org), 29.04.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Education, is properly cited. The complete bibliographic information, a link to the original publication on https://mededu.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://mededu.jmir.org/2022/2/e30988" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Residents may benefit from simulated practice with personalized feedback to prepare for high-stakes disclosure conversations with patients after harmful errors and to meet American Council on Graduate Medical Education mandates. Ideally, feedback would come from patients who have experienced communication after medical harm, but medical researchers and leaders have found it difficult to reach this community, which has made this approach impractical at scale. The Video-Based Communication Assessment app is designed to engage crowdsourced laypeople to rate physician communication skills but has not been evaluated for use with medical harm scenarios.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to compare the reliability of 2 assessment groups (crowdsourced laypeople and patient advocates) in rating physician error disclosure communication skills using the Video-Based Communication Assessment app.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Internal medicine residents used the Video-Based Communication Assessment app; the case, which consisted of 3 sequential vignettes, depicted a delayed diagnosis of breast cancer. Panels of patient advocates who have experienced harmful medical error, either personally or through a family member, and crowdsourced laypeople used a 5-point scale to rate the residents’ error disclosure communication skills (6 items) based on audiorecorded responses. Ratings were aggregated across items and vignettes to create a numerical communication score for each physician. We used analysis of variance to compare stringency, and we used the Pearson correlation between patient advocates and laypeople to identify whether rank order would be preserved between groups. We used generalizability theory to examine the difference in assessment reliability between patient advocates and laypeople.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Internal medicine residents (n=20) used the Video-Based Communication Assessment app. All patient advocates (n=8) and 42 of 59 crowdsourced laypeople who had been recruited provided complete, high-quality ratings. Patient advocates rated communication more stringently than crowdsourced laypeople (patient advocates: mean 3.19, SD 0.55; laypeople: mean 3.55, SD 0.40; <italic>P</italic>&#60;.001), but patient advocates’ and crowdsourced laypeople’s ratings of physicians were highly correlated (<italic>r</italic>=0.82, <italic>P</italic>&#60;.001). Reliability for 8 raters and 6 vignettes was acceptable (patient advocates: G coefficient 0.82; crowdsourced laypeople: G coefficient 0.65). Decision studies estimated that 12 crowdsourced layperson raters and 9 vignettes would yield an acceptable G coefficient of 0.75.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Crowdsourced laypeople may represent a sustainable source of reliable assessments of physician error disclosure skills. For a simulated case involving delayed diagnosis of breast cancer, laypeople correctly identified high and low performers. However, at least 12 raters and 9 vignettes are required to ensure adequate reliability, and future studies are warranted. Crowdsourced laypeople rate less stringently than raters who have experienced harm. Future research should examine the value of the Video-Based Communication Assessment app for formative assessment, summative assessment, and just-in-time coaching of error disclosure communication skills.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>medical error disclosure</kwd>
        <kwd>simulation studies</kwd>
        <kwd>communication assessment</kwd>
        <kwd>graduate medical education</kwd>
        <kwd>crowdsourcing</kwd>
        <kwd>patient-centered care</kwd>
        <kwd>generalizability theory</kwd>
        <kwd>medical education</kwd>
        <kwd>medical error</kwd>
        <kwd>communication</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Poor communication after a medical injury often leaves patients and families feeling alone, afraid, confused, and more likely to seek redress through malpractice claims [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. One cause of this communication gap cited by both practicing and resident physicians is inadequate training on disclosing harmful medical errors [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Recently, communication and resolution programs have emerged as a framework to enable clinicians and health care institutions to communicate openly with patients and families, apologize, and offer compensation if an error contributed to patient harm [<xref ref-type="bibr" rid="ref5">5</xref>]. Communication and resolution programs require clinicians, institutional leaders, and liability insurers to collaborate to provide transparent communication and emotional support for harmed patients. Communication and resolution programs align with recent American Council on Graduate Medical Education mandates that require all trainees to participate in real or simulated disclosure of harm events [<xref ref-type="bibr" rid="ref6">6</xref>]. However, organizations adopting communication and resolution programs may struggle to prepare physicians for these difficult conversations, in part because of challenges in assessing and improving the specific communication skills required [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      <p>Traditional methods of assessing physician communication are not suitable for this particular type of task. For example, patient surveys can evaluate actual performance on routine communication, but individual physicians disclose harmful errors infrequently, and these high-stakes discussions are difficult to observe or record. As an alternative to real-world practice, educators often use standardized patients (individuals trained to act as a real patient) and simulated encounters for formative and summative assessments [<xref ref-type="bibr" rid="ref8">8</xref>]. However, standardized patient exams are logistically intensive, expensive to implement at scale, and lack statistical reliability [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref12">12</xref>]. In addition, it is unknown whether standardized patients or peer physician raters adequately approximate the viewpoint of patients who have experienced medical injury. In particular, physicians’ viewpoints about ideal disclosure content and performance differ from those of patients, which limits physicians’ abilities to assess and coach other physicians’ performance [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Although feedback would ideally come from harmed patients, researchers have found it difficult to reach this community because providers are reluctant to release details about harmed patients, and because patients hesitate to revisit painful events [<xref ref-type="bibr" rid="ref15">15</xref>]. To make progress, educators and communication and resolution program leaders need a cost-effective and standardized assessment tool that provides actionable, on-demand, high-volume, and patient-centered feedback about physician communication skills after harm.</p>
      <p>The National Board of Medical Examiners recently developed the Video-Based Communication Assessment app as an efficient approach to producing timely, specific, and individual feedback about verbal communication [<xref ref-type="bibr" rid="ref16">16</xref>]. The Video-Based Communication Assessment app displays brief videos of case vignettes and asks users to audiorecord what they would say next to the patient [<xref ref-type="bibr" rid="ref17">17</xref>]. Recorded responses are rated by web-based panels of analog patients. Analog patients are untrained raters given the task of listening to and rating their impressions of a medical interaction while assuming the patient perspective [<xref ref-type="bibr" rid="ref18">18</xref>]. Analog patients are typically laypeople recruited via MTurk [<xref ref-type="bibr" rid="ref19">19</xref>]; MTurk provides access to a very large, diverse population for survey research, and there is extensive proof that MTurk is an inexpensive, rapid, and high-quality data source [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. Users then receive feedback reports with their individual ratings, comparative data on the user’s cohort, learning points derived from analysis of crowdsourced raters’ comments, and selected highly rated responses from peers. The only study [<xref ref-type="bibr" rid="ref22">22</xref>] of the Video-Based Communication Assessment app published to date used a variety of 16 typical primary care communication scenarios and found that crowdsourced laypeople can provide high-quality, actionable feedback regarding physician communication skills. Key steps in evaluating the Video-Based Communication Assessment app for error disclosure skill assessment are understanding reliability, educational outcomes, and adoption challenges.</p>
      <p>Our aim was to evaluate the reliability of crowdsourced laypeople as raters by comparing their ratings with those of patient advocates who had experienced harm in the course of their own or a loved one’s medical care. We hypothesized that crowdsourced layperson raters could provide reliable ratings of this specific communication skill, given sufficient panel size.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>This descriptive study is part of a larger project to develop instruments for assessing resident error disclosure skills. With input from experienced attending physicians, we designed and pilot-tested 4 cases specific to the practice of internal medicine. Each case consisted of 3 or 4 vignettes depicting sequential stages in a conversation (for example, initially sharing information about a mistake, responding to a patient’s emotional reaction). We recruited resident physicians at an academic center to use the Video-Based Communication Assessment app. Physicians’ disclosure skills were rated by crowdsourced laypeople recruited on MTurk (Mechanical Turk; Amazon) and by a panel of patient advocates.</p>
      </sec>
      <sec>
        <title>Participants</title>
        <p>We recruited resident physicians in postgraduate years 1 through 3 from the University of Washington academic medical center. We invited all 183 internal medicine residents by email and provided dedicated participation time at a program-wide web-based educational conference (approximate attendance: 40 residents). Residents received a 10-minute orientation to the Video-Based Communication Assessment app and were given class time to participate. Participation was optional. Participants were randomly assigned to 1 of 2 pairs of initial cases to counteract order effects, using a crossover design (<xref rid="figure1" ref-type="fig">Figure 1</xref>). After receiving a feedback report, residents were eligible to complete the second 2 cases on their own. Participating residents received a US $50 gift card after completing all 4 cases during a 2-month period; however, only 1 case was used in this study.</p>
        <p>We used the following inclusion criteria for laypeople: resident of the United States, 18 years or older, and able to speak and read English. Patient advocates were recruited through advertisements with the Patient and Family Advocate Committee of the Collaborative for Accountability and Improvement (a network of health care leaders, attorneys, insurers, and patient advocates who support the development and widespread application of communication and resolution programs). Patient advocates were recruited if they met the following criteria: resident of the United States, 18 years or older, able to speak and read English, not currently or previously employed in health care, and having a personal history of having experienced serious medical injury in their own care or that of a family member. Patient advocates received a US $200 gift card for participation. Crowdsourced raters received variable amounts based on a rate of US $0.20 per rating. A crowdsourced rater performing the same total number of ratings as a patient advocate would have received US $12.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Crossover study design for 21 internal medicine residents using the Video-Based Communication Assessment app at study start (time 1) and approximately 4 weeks later (time 2). The study case in the blue box (breast cancer misdiagnosis) was selected for further study.</p>
          </caption>
          <graphic xlink:href="mededu_v8i2e30988_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Ethics</title>
        <p>The University of Washington Institutional Review Board determined that this study was exempt from review for resident, layperson, and patient advocate participants based on its policies, procedures, and guidance [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
      </sec>
      <sec>
        <title>Video-Based Communication Assessment App</title>
        <p>The concept and software of the Video-Based Communication Assessment app have been previously described [<xref ref-type="bibr" rid="ref16">16</xref>]. The app was used to present vignettes, record user responses, and deliver feedback reports (<xref rid="figure2" ref-type="fig">Figure 2</xref>). Instead of a single stand-alone vignette, in this study, cases consisted of a linked series of 3 or 4 vignettes to simulate an unfolding conversation. Because a live conversation might not progress in the same manner or sequence, each vignette after the first was accompanied by text declaring what the patient understood at that point.</p>
        <p>We used a case that depicted harm resulting from a delayed diagnosis of breast cancer, which is discovered by a primary care doctor just before the patient returns for an office visit (<xref ref-type="table" rid="table1">Table 1</xref>). This case was chosen because it has 3 segments, rather than 4, which reduced the time and cognitive demands imposed on the small group of patient advocates.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Screenshot from the Video-Based Communication Assessment app displaying a case of delayed diagnosis of breast cancer and the user controls for playing the vignette video and making an audio response to the patient.</p>
          </caption>
          <graphic xlink:href="mededu_v8i2e30988_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Text and scenario (spoken by actors in 3 linked vignettes) presented to users (physicians) and raters (laypeople and patient advocates).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="80"/>
            <col width="320"/>
            <col width="300"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td>Vignette</td>
                <td>Situation description (to physician)</td>
                <td>Situation description (to rater)</td>
                <td>What the patient says</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>You are a primary care doctor for a 48-year-old woman with diabetes. Today she mentions a breast lump that is new to her. You review her chart and see a mammogram report from last year had a suspicious calcification with recommendation for biopsy. At her last health maintenance visit you did not document a plan for the result and do not recall seeing it before now. You examine her and the site of the lump corresponds to the location on x-ray. She says:</td>
                <td>Lorna Smith visits her primary care doctor to evaluate a new breast lump. She figures it isn't anything serious because she had a mammogram last year and never heard about any abnormal results. The doctor examined her and she changed back to regular clothes. She wants to discuss the lump now and says:</td>
                <td>“When I didn’t hear from your office about the mammogram, I assumed everything was normal. Was there any sign of this lump on the test last year?”</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>You've told the patient that there were early warning signs of possible breast cancer on her mammogram one year ago. She says:</td>
                <td>Lorna has learned that her mammogram last year showed early signs of possible breast cancer, but nothing was done about it. She is feeling panicked and says:</td>
                <td>“This is terrible! I’ve never been more frightened…plus you’re telling me that we might have known about it a long time ago!”</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>You've acknowledged how upsetting the error is. The patient now understands that there were early warning signs of possible breast cancer on her mammogram. She says:</td>
                <td>Lorna feels like the clinic and her doctor have failed her. She asks:</td>
                <td>“How could this happen to me? I feel like I can’t trust anyone anymore. How am I supposed to believe your advice in the future?”<break/>  <break/>  </td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Data Collection</title>
        <p>Resident physicians participated in the video-based communication assessment and provided audio responses to each vignette. All audio responses to a single case were bundled into rating tasks for the raters, comprising 4 physicians’ responses to a case. Raters first completed an audio check and answered questions about demographic characteristics. Raters were asked to read the description of the vignette, view the patient video, listen to each vignette, and rate 6 items (<xref ref-type="table" rid="table2">Table 2</xref>). Due to the sequential design, we removed raters who did not complete all ratings. We also removed raters who used 2 or fewer response items on the 5-item survey because this may be a sign of inattention and poor rater quality [<xref ref-type="bibr" rid="ref24">24</xref>]. We defined outliers as raters who reduced the interrater reliability of their task by 0.1 or more.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Items to assess error disclosure communication skills.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="560"/>
            <col width="440"/>
            <thead>
              <tr valign="top">
                <td>Item</td>
                <td>Response options</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Overall this provider’s response was</td>
                <td>Poor, fair, good, very good, or excellent</td>
              </tr>
              <tr valign="top">
                <td>I would feel this provider was accountable for their actions</td>
                <td>Not at all, a little, somewhat, very much, or completely</td>
              </tr>
              <tr valign="top">
                <td>I would feel this provider was being honest about what happened</td>
                <td>Not at all, a little, somewhat, very much, or completely</td>
              </tr>
              <tr valign="top">
                <td>I would feel this provider was sincerely sorry for what happened</td>
                <td>Not at all, a little, somewhat, very much, or completely</td>
              </tr>
              <tr valign="top">
                <td>I would feel the provider understood how I was feeling</td>
                <td>Not at all, a little, somewhat, very much, or completely</td>
              </tr>
              <tr valign="top">
                <td>I would feel this provider cared about me</td>
                <td>Not at all, a little, somewhat, very much, or completely</td>
              </tr>
              <tr valign="top">
                <td>What would you want the provider to say if you were the patient in this situation?</td>
                <td>Free text</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Analysis</title>
        <p>To create vignette-level scores, ratings were aggregated across all items for each vignette. To compare stringency between groups, we employed a 3×2 repeated measures factorial analysis of variance for vignette (1, 2, 3) and rater (patient advocate, crowdsourced layperson). To create overall assessment scores, we aggregated all vignette-level scores for each user (these continuous scores were derived from ordinal approximations of continuous variables, ie, the mean of Likert-scale responses [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]). To determine if an individual physician’s score would be preserved between groups in relation to their peers, we calculated the Pearson correlation.</p>
        <p>Generalizability theory utilizes analysis of variance to parse multiple sources of measurement error and estimate reliability under specific conditions [<xref ref-type="bibr" rid="ref27">27</xref>]. A generalizability analysis was conducted using GENOVA (version 2.1; University of Iowa) to compute variance components for a fully crossed design utilizing a panel of patient advocates [<xref ref-type="bibr" rid="ref28">28</xref>]. A separate generalizability analysis was conducted using urGENOVA (version 2.1; University of Iowa) to generate variance components for an unbalanced design utilizing crowdsourced layperson raters [<xref ref-type="bibr" rid="ref29">29</xref>]. In order to determine the optimal design to achieve sufficient reliability, the estimated variance components were used to conduct multiple decision studies to produce G coefficients corresponding to varying numbers of vignettes and raters for each design.</p>
      </sec>
      <sec>
        <title>Patient Advocate Design</title>
        <p>To balance consistency and attention span, patient advocates rated batches of 7 physician responses at a time. Batches were block randomized and consisted of physicians’ audio responses to all 3 vignettes. In G-theory, this is referred to as a fully crossed design—physician crossed with vignette crossed with rater (p × v × λ).</p>
      </sec>
      <sec>
        <title>Crowdsourced Layperson Design</title>
        <p>Crowdsourced laypeople rated a subset of the physicians. Each crowdsourced layperson rated a single batch of 4 physician responses (all 3 vignettes). In G-theory, this is referred to as a rater nested within physician crossed with vignette ((λ:p) × v) design.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Participant Demographics</title>
        <p>Although 21 internal medicine physicians completed all 3 vignettes, one physician was omitted from analyses because of incomplete ratings; therefore, 20 physicians (male: 6/20, 30%; female: 14/20, 70%), with a total of 60 audiorecordings, were rated. The patient advocate panel (n=8; male: 2/8, 25%; female: 6/8, 75%) had a median age of 57 years (IQR 53-74.3). Patient advocates reported that it took an average of 116 minutes (SD 62) to rate all 20 cases. A total of 59 crowdsourced laypeople were recruited, but 8 were removed because they did not rate all 3 vignettes in the case, 8 were removed for utilizing 2 or fewer response items, and 1 was deemed to be an outlier; thus, 42 crowdsourced layperson raters were included. Of the 42 crowdsourced raters, 16 (38%) were female; 20 individuals (48%) were between 18 and 34 years old, and 22 (52%) individuals were between 35 and 64 years old.</p>
      </sec>
      <sec>
        <title>Comparing Crowdsourced Laypeople and Patient Advocates</title>
        <p>There was a significant overall main effect for rater (<italic>F</italic><sub>1,19</sub>=24.14, <italic>P</italic>&#60;.001, <italic>d</italic>=0.75)—patient advocates (mean 3.19, SD 0.55) rated communication more stringently than crowdsourced laypeople (mean 3.55, SD 0.40) (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> and <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). Patient advocate ratings were strongly correlated with crowdsourced layperson ratings (<italic>r</italic>=0.82, <italic>P</italic>&#60;.001) (<xref rid="figure3" ref-type="fig">Figure 3</xref>).</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Correlation between ratings of overall communication skill for resident physicians generated by panels of patient advocates and crowdsourced laypeople.</p>
          </caption>
          <graphic xlink:href="mededu_v8i2e30988_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Generalizability</title>
        <p>Generalizability analysis yielded the variance attributable to each component (<xref ref-type="table" rid="table3">Table 3</xref>). The G coefficients for 8 raters and 3 vignettes were 0.7 for patient advocates and 0.6 for crowdsourced laypeople. Maintaining 8 raters and increasing the task to 6 vignettes would increase the G coefficients (patient advocates: 0.82; crowdsourced laypeople: 0.65). Increasing the panels to 12 raters for 6 vignettes would increase the G coefficients (patient advocates: 0.83; crowdsourced laypeople: 0.72). Using 12 raters and 9 vignettes would yield G coefficients of 0.88 and 0.75 for patient advocates and crowdsourced laypeople, respectively (<xref rid="figure4" ref-type="fig">Figure 4</xref>).</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Generalizability study variance components.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="340"/>
            <col width="0"/>
            <col width="300"/>
            <col width="0"/>
            <col width="330"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Source of variance</td>
                <td colspan="2">Variance component</td>
                <td>Variance percentage</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Patient advocates (p × v ×</bold>
                  <bold>λ</bold>
                  <bold>design)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physician</td>
                <td colspan="2">0.214</td>
                <td colspan="2">17.979</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Rater</td>
                <td colspan="2">0.311</td>
                <td colspan="2">26.105</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Vignette</td>
                <td colspan="2">0.017</td>
                <td colspan="2">1.421</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physician × rater</td>
                <td colspan="2">0.008</td>
                <td colspan="2">0.690</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physician × vignette</td>
                <td colspan="2">0.210</td>
                <td colspan="2">17.586</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Rater × vignette</td>
                <td colspan="2">0.012</td>
                <td colspan="2">0.986</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Residual</td>
                <td colspan="2">0.420</td>
                <td colspan="2">35.232</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Crowdsourced laypeople ((λ:p) × v design)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physician</td>
                <td colspan="2">0.121</td>
                <td colspan="2">14.564</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Vignette</td>
                <td colspan="2">0.007</td>
                <td colspan="2">0.906</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Rater:physician</td>
                <td colspan="2">0.368</td>
                <td colspan="2">44.402</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physician × vignette</td>
                <td colspan="2">0.074</td>
                <td colspan="2">8.952</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Residual</td>
                <td colspan="2">0.258</td>
                <td colspan="2">31.177</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Reliability (G coefficient) models for panels of patient advocates and crowdsourced laypeople, by panel size and number of vignettes rated per user.</p>
          </caption>
          <graphic xlink:href="mededu_v8i2e30988_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Patient advocates rated communication skills more stringently than crowdsourced laypeople, but the correlation between patient advocates’ ratings and crowdsourced laypeople’s ratings was high. Patient advocates also had higher reliability, but decision studies estimated that panels of crowdsourced laypeople could achieve a G coefficient of 0.75 with 12 raters and 9 vignettes.</p>
        <p>These findings demonstrate that crowdsourced laypeople can reliably rate the error disclosure communication skills of physicians using the Video-Based Communication Assessment app. This is encouraging for communication and resolution program leaders and graduate medical educators who require an abundant and affordable pool of raters to support personalized feedback processes in the next generation of physician communication skill training programs. In principle, patient advocates would offer the best possible feedback, but large-scale training efforts would rapidly exhaust the willing and available patient advocate population, given the amount of time that these raters reported spending on this study. Instead, crowdsourced laypeople represent a large and sustainable pool of on-demand raters. Nonetheless, our finding that approximately one-third of crowdsourced laypeople (17/59, 29%) must be removed from analysis to optimize assessment reliability indicates that continuous rater performance monitoring, requirements for raters to complete all vignettes in a series, and a sufficient number of raters would be required for widespread deployment of the Video-Based Communication Assessment app in error disclosure training.</p>
        <p>Educators who use the Video-Based Communication Assessment app should understand how crowdsourced raters differ from patient advocates, who represent the gold standard for informed assessment of physician error disclosure skills. Compared with crowdsourced individuals, patient advocates can achieve high reliability with smaller panel sizes and fewer vignettes per physician. This suggests that patient advocates have a common concept of the components of verbal communication that affect the quality of error disclosure and are highly attuned to differences among physicians. Of note, patient advocates assigned lower ratings to resident error disclosure communication than crowdsourced laypeople did. Educators and coaches should recognize that overall scores from crowdsourced laypeople are potentially more generous than those of patients who have experienced harm from medical errors and should note this in reviewing feedback with residents.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>The Video-Based Communication Assessment app had been previously only used with groups of stand-alone vignettes [<xref ref-type="bibr" rid="ref22">22</xref>], but this is the first example of a case with sequential vignettes that simulate a longer conversation. The satisfactory reliability should encourage educators to develop cases for other extended exchanges, such as discussions about goals of care, shared decision-making, or new diagnoses of serious illness. However, our need to sacrifice a subset of ratings by crowdsourced laypeople who had not completed all of the vignettes within a case suggests that longer cases would benefit from a modified approach, such as the use of attention checks or restrictions (eg, a high past task acceptance ratio) [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>Although physician educators have been used to evaluate trainee disclosure skills in a prior study [<xref ref-type="bibr" rid="ref7">7</xref>], our findings suggest that using faculty as raters would be too costly for large training programs. Based on the time estimates in this study, a residency program with 60 residents, each completing 4 cases, would require an educator to allocate approximately 23 hours to listening and rating audio. Rather than finding 6 to 8 faculty to do this task for a single training session, crowdsourcing laypeople appears to be a more viable and rapid solution.</p>
      </sec>
      <sec>
        <title>Future Directions</title>
        <p>This study sets the stage for investigation of use of the Video-Based Communication Assessment app for error disclosure training, for example, for formative assessment (either for self-directed improvement or in conjunction with coaching from a teacher) or summative assessment and in the identification of struggling learners. Although we did not define a threshold for competency, low performers might warrant additional support from residency leaders, including attention on communication performance in other scenarios. Additional areas to explore include whether the tool can be used in undergraduate medical education, continuing medical education, or in just-in-time scenarios (for physicians to practice and receive feedback just before real-life error disclosure). Future studies should investigate the role of different error types (eg, diagnostic or therapeutic), harm severity, physician and patient identity (eg, gender, race), tone, and accent on ratings. The Video-Based Communication Assessment app could be used to understand the efficacy of training interventions and to study the natural history of communication skill development over time. Finally, future studies should also investigate whether error disclosure performance using the Video-Based Communication Assessment app is associated with other safety behaviors encouraged by communication and resolution programs, such as event reporting, root cause analysis, or physician participation in system redesign to prevent future errors.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>Our work has limitations. We did not assess whether crowdsourced laypeople had personal experience with medical harm and did not measure the amount of time crowdsourced laypeople spent on this evaluation task. Additionally, we recruited patient advocates through their involvement in a national advocacy organization, and their rating behaviors may not generalize to the broader community of patients who have been harmed by care. The convenience sample of patient advocates was not age- and gender-matched to the sample of crowdsourced individuals, and age was not collected as a continuous variable for crowdsourced individuals. The Video-Based Communication Assessment app does not measure nonverbal communication skills, which play an essential role in communication about medical error [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. Finally, this study was conducted using a single case with a breast cancer misdiagnosis and tested with medical residents and may, therefore, not be generalizable to other uses—other unique patient scenarios may require separate validation of crowdsourced laypeople as analog patients. Future research should aim to replicate findings with a more robust sample size.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>Crowdsourced laypeople reliably rated error disclosure skills using the Video-Based Communication Assessment app, although reliably distinguishing high and low performers would require larger panels (9-12 raters) and more vignettes per examinee (9 or more). Fortunately, this is readily achievable in error disclosure curricula. Future studies should focus on the educational outcomes achieved by presenting analog patient feedback to resident physicians about their error disclosure communication skills, and the role of the Video-Based Communication Assessment app in other learner groups or just-in-time scenarios.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Deidentified data of ratings by patient advocates for residents (user) and vignettes (v1,v2,v3).</p>
        <media xlink:href="mededu_v8i2e30988_app1.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 14 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Deidentified data of ratings by crowdsourced laypeople for residents (user) and vignettes (v1,v2,v3).</p>
        <media xlink:href="mededu_v8i2e30988_app2.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 14 KB"/>
      </supplementary-material>
    </app-group>
    <ack>
      <p>We thank Anders Chen, MD, and Kevin Blau, MD, for their assistance with study enrollment. The study was funded by the University of Washington’s Patient Safety Innovations Program. The funder had no role in the study design or manuscript review.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Garbutt</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Waterman</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Flum</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Larson</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Waterman</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Dunagan</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Fraser</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Levinson</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Choosing your words carefully: how physicians would disclose harmful medical errors to patients</article-title>
          <source>Arch Intern Med</source>
          <year>2006</year>
          <volume>166</volume>
          <issue>15</issue>
          <fpage>1585</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1001/archinte.166.15.1585</pub-id>
          <pub-id pub-id-type="medline">16908791</pub-id>
          <pub-id pub-id-type="pii">166/15/1585</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Delbanco</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>SK</given-names>
            </name>
          </person-group>
          <article-title>Guilty, afraid, and alone--struggling with medical error</article-title>
          <source>N Engl J Med</source>
          <year>2007</year>
          <month>10</month>
          <day>25</day>
          <volume>357</volume>
          <issue>17</issue>
          <fpage>1682</fpage>
          <lpage>3</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJMp078104</pub-id>
          <pub-id pub-id-type="medline">17960011</pub-id>
          <pub-id pub-id-type="pii">357/17/1682</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>White</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Krauss</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Garbutt</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dunagan</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Fraser</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Levinson</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Larson</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>TH</given-names>
            </name>
          </person-group>
          <article-title>How trainees would disclose medical errors: educational implications for training programmes</article-title>
          <source>Med Educ</source>
          <year>2011</year>
          <month>04</month>
          <volume>45</volume>
          <issue>4</issue>
          <fpage>372</fpage>
          <lpage>80</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21401685"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1365-2923.2010.03875.x</pub-id>
          <pub-id pub-id-type="medline">21401685</pub-id>
          <pub-id pub-id-type="pmcid">PMC3501535</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Waterman</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Garbutt</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Kapp</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Dunagan</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Fraser</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Levinson</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>US and Canadian physicians' attitudes and experiences regarding disclosing errors to patients</article-title>
          <source>Arch Intern Med</source>
          <year>2006</year>
          <volume>166</volume>
          <issue>15</issue>
          <fpage>1605</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1001/archinte.166.15.1605</pub-id>
          <pub-id pub-id-type="medline">16908793</pub-id>
          <pub-id pub-id-type="pii">166/15/1605</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mello</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Kachalia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Roche</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Niel</surname>
              <given-names>MV</given-names>
            </name>
            <name name-style="western">
              <surname>Buchsbaum</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dodson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Folcarelli</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Benjamin</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Sands</surname>
              <given-names>KE</given-names>
            </name>
          </person-group>
          <article-title>Outcomes in two Massachusetts hospital systems give reason for optimism about communication-and-resolution programs</article-title>
          <source>Health Aff (Millwood)</source>
          <year>2017</year>
          <month>10</month>
          <day>01</day>
          <volume>36</volume>
          <issue>10</issue>
          <fpage>1795</fpage>
          <lpage>1803</lpage>
          <pub-id pub-id-type="doi">10.1377/hlthaff.2017.0320</pub-id>
          <pub-id pub-id-type="medline">28971925</pub-id>
          <pub-id pub-id-type="pii">36/10/1795</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <article-title>ACGME common program requirements (residency): section VI.A.1.a</article-title>
          <source>Accreditation Council for Graduate Medical Education</source>
          <access-date>2022-02-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.acgme.org/Portals/0/PFAssets/ProgramRequirements/CPRResidency2019.pdf">http://www.acgme.org/Portals/0/PFAssets/ProgramRequirements/CPRResidency2019.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stroud</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Hollenberg</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Levinson</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Teaching medical error disclosure to physicians-in-training: a scoping review</article-title>
          <source>Acad Med</source>
          <year>2013</year>
          <month>06</month>
          <volume>88</volume>
          <issue>6</issue>
          <fpage>884</fpage>
          <lpage>92</lpage>
          <pub-id pub-id-type="doi">10.1097/ACM.0b013e31828f898f</pub-id>
          <pub-id pub-id-type="medline">23619064</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Scalese</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Holmboe</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Durning</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hawkins</surname>
              <given-names>RE</given-names>
            </name>
          </person-group>
          <article-title>Simulation-based assessment</article-title>
          <source>Evaluation of Clinical Competence</source>
          <year>2018</year>
          <publisher-loc>Amsterdam</publisher-loc>
          <publisher-name>Elsevier</publisher-name>
          <fpage>215</fpage>
          <lpage>255</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stroud</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>McIlroy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Levinson</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Skills of internal medicine residents in disclosing medical errors: a study using standardized patients</article-title>
          <source>Acad Med</source>
          <year>2009</year>
          <month>12</month>
          <volume>84</volume>
          <issue>12</issue>
          <fpage>1803</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1097/ACM.0b013e3181bf9fef</pub-id>
          <pub-id pub-id-type="medline">19940591</pub-id>
          <pub-id pub-id-type="pii">00001888-200912000-00033</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patrício</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Julião</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fareleira</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Carneiro</surname>
              <given-names>AV</given-names>
            </name>
          </person-group>
          <article-title>Is the OSCE a feasible tool to assess competencies in undergraduate medical education?</article-title>
          <source>Med Teach</source>
          <year>2013</year>
          <month>06</month>
          <volume>35</volume>
          <issue>6</issue>
          <fpage>503</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.3109/0142159X.2013.774330</pub-id>
          <pub-id pub-id-type="medline">23521582</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adamo</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Simulated and standardized patients in OSCEs: achievements and challenges 1992-2003</article-title>
          <source>Med Teach</source>
          <year>2003</year>
          <month>05</month>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>262</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.1080/0142159031000100300</pub-id>
          <pub-id pub-id-type="medline">12881047</pub-id>
          <pub-id pub-id-type="pii">A0AJ10QHMC0U345G</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jacobs</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>van Jaarsveldt</surname>
              <given-names>DE</given-names>
            </name>
          </person-group>
          <article-title>'The character rests heavily within me': drama students as standardized patients in mental health nursing education</article-title>
          <source>J Psychiatr Ment Health Nurs</source>
          <year>2016</year>
          <month>04</month>
          <volume>23</volume>
          <issue>3-4</issue>
          <fpage>198</fpage>
          <lpage>206</lpage>
          <pub-id pub-id-type="doi">10.1111/jpm.12302</pub-id>
          <pub-id pub-id-type="medline">27090349</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martinez</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Browning</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Varrin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sarnoff Lee</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>SK</given-names>
            </name>
          </person-group>
          <article-title>Increasing patient-clinician concordance about medical error disclosure through the patient TIPS model</article-title>
          <source>J Patient Saf</source>
          <year>2019</year>
          <month>12</month>
          <volume>15</volume>
          <issue>4</issue>
          <fpage>305</fpage>
          <lpage>307</lpage>
          <pub-id pub-id-type="doi">10.1097/PTS.0000000000000284</pub-id>
          <pub-id pub-id-type="medline">28492422</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>TH</given-names>
            </name>
          </person-group>
          <article-title>A 62-year-old woman with skin cancer who experienced wrong-site surgery: review of medical error</article-title>
          <source>JAMA</source>
          <year>2009</year>
          <month>08</month>
          <day>12</day>
          <volume>302</volume>
          <issue>6</issue>
          <fpage>669</fpage>
          <lpage>77</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2009.1011</pub-id>
          <pub-id pub-id-type="medline">19584321</pub-id>
          <pub-id pub-id-type="pii">2009.1011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Iedema</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Britton</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Piper</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Grbich</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Allan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tuckett</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Manias</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>TH</given-names>
            </name>
          </person-group>
          <article-title>Patients' and family members' views on how clinicians enact and how they should enact incident disclosure: the "100 patient stories" qualitative study</article-title>
          <source>BMJ</source>
          <year>2011</year>
          <month>07</month>
          <day>25</day>
          <volume>343</volume>
          <fpage>d4423</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21788260"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.d4423</pub-id>
          <pub-id pub-id-type="medline">21788260</pub-id>
          <pub-id pub-id-type="pmcid">PMC3142870</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mazor</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Hoppe</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Kochersberger</surname>
              <given-names>AO</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Reim</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Video-based communication assessment: development of an innovative system for assessing clinician-patient communication</article-title>
          <source>JMIR Med Educ</source>
          <year>2019</year>
          <month>02</month>
          <day>14</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>e10400</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.2196/10400"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/10400</pub-id>
          <pub-id pub-id-type="medline">30710460</pub-id>
          <pub-id pub-id-type="pii">v5i1e10400</pub-id>
          <pub-id pub-id-type="pmcid">PMC6393776</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>National Board of Medical Examiners</collab>
          </person-group>
          <article-title>Introducing the VCA</article-title>
          <source>YouTube</source>
          <access-date>2022-02-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.youtube.com/watch?v=ZqdZKVk7aak">https://www.youtube.com/watch?v=ZqdZKVk7aak</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blanch-Hartigan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Krupat</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Irish</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>Can naive viewers put themselves in the patients' shoes?: reliability and validity of the analogue patient methodology</article-title>
          <source>Med Care</source>
          <year>2013</year>
          <month>03</month>
          <volume>51</volume>
          <issue>3</issue>
          <fpage>e16</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1097/MLR.0b013e31822945cc</pub-id>
          <pub-id pub-id-type="medline">22498688</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sheehan</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Crowdsourcing research: Data collection with Amazon’s Mechanical Turk</article-title>
          <source>Communication Monographs</source>
          <year>2018</year>
          <volume>85</volume>
          <issue>1</issue>
          <fpage>140</fpage>
          <lpage>156</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1080/03637751.2017.1342043"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/03637751.2017.1342043</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Buhrmester</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kwang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gosling</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>Amazon's Mechanical Turk: a new source of inexpensive, yet high-quality, data?</article-title>
          <source>Perspect Psychol Sci</source>
          <year>2011</year>
          <month>01</month>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1177/1745691610393980</pub-id>
          <pub-id pub-id-type="medline">26162106</pub-id>
          <pub-id pub-id-type="pii">6/1/3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mortensen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>TL</given-names>
            </name>
          </person-group>
          <article-title>Comparing Amazon's Mechanical Turk platform to conventional data collection methods in the health and medical research literature</article-title>
          <source>J Gen Intern Med</source>
          <year>2018</year>
          <month>04</month>
          <volume>33</volume>
          <issue>4</issue>
          <fpage>533</fpage>
          <lpage>538</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29302882"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-017-4246-0</pub-id>
          <pub-id pub-id-type="medline">29302882</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11606-017-4246-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC5880761</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mazor</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hoppe</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>D'Addario</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Musselman</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tallia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Using crowdsourced analog patients to provide feedback on physician communication skills</article-title>
          <source>Patient Educ Couns</source>
          <year>2021</year>
          <month>09</month>
          <volume>104</volume>
          <issue>9</issue>
          <fpage>2297</fpage>
          <lpage>2303</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.pec.2021.02.047"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pec.2021.02.047</pub-id>
          <pub-id pub-id-type="medline">33715944</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(21)00169-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <article-title>Guidance exempt research</article-title>
          <source>UW Research</source>
          <access-date>2022-04-28</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.washington.edu/research/policies/guidance-exempt-research-2/">https://www.washington.edu/research/policies/guidance-exempt-research-2/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vriesema</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Gehlbach</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Assessing survey satisficing: the impact of unmotivated questionnaire responding on data quality</article-title>
          <source>Educ Res</source>
          <year>2021</year>
          <month>08</month>
          <day>24</day>
          <volume>50</volume>
          <issue>9</issue>
          <fpage>618</fpage>
          <lpage>627</lpage>
          <pub-id pub-id-type="doi">10.3102/0013189X211040054</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Norman</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Non-cognitive factors in health sciences education: from the clinic floor to the cutting room floor</article-title>
          <source>Adv Health Sci Educ Theory Pract</source>
          <year>2010</year>
          <month>03</month>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1007/s10459-009-9204-0</pub-id>
          <pub-id pub-id-type="medline">19924553</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10459-009-9204-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Artino</surname>
              <given-names>AR</given-names>
            </name>
          </person-group>
          <article-title>Analyzing and interpreting data from Likert-type scales</article-title>
          <source>J Grad Med Educ</source>
          <year>2013</year>
          <month>12</month>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>541</fpage>
          <lpage>2</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24454995"/>
          </comment>
          <pub-id pub-id-type="doi">10.4300/JGME-5-4-18</pub-id>
          <pub-id pub-id-type="medline">24454995</pub-id>
          <pub-id pub-id-type="pii">JGME-5-4-18</pub-id>
          <pub-id pub-id-type="pmcid">PMC3886444</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Garbutt</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Waterman</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Flum</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Larson</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Waterman</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Dunagan</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Fraser</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Levinson</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Choosing your words carefully: how physicians would disclose harmful medical errors to patients</article-title>
          <source>Arch Intern Med</source>
          <year>2006</year>
          <volume>166</volume>
          <issue>15</issue>
          <fpage>1585</fpage>
          <lpage>93</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1001/archinte.166.15.1585"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/archinte.166.15.1585</pub-id>
          <pub-id pub-id-type="medline">16908791</pub-id>
          <pub-id pub-id-type="pii">166/15/1585</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Crick</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>Manual for GENOVA: A Generalized Analysis of Variance System</source>
          <year>1983</year>
          <publisher-loc>Iowa City</publisher-loc>
          <publisher-name>ACT Inc</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <source>Generalizability Theory</source>
          <year>2001</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chandler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shapiro</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Conducting clinical research using crowdsourced convenience samples</article-title>
          <source>Annu Rev Clin Psychol</source>
          <year>2016</year>
          <volume>12</volume>
          <fpage>53</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1146/annurev-clinpsy-021815-093623</pub-id>
          <pub-id pub-id-type="medline">26772208</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Vosgerau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Acquisti</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Reputation as a sufficient condition for data quality on Amazon Mechanical Turk</article-title>
          <source>Behav Res Methods</source>
          <year>2014</year>
          <month>12</month>
          <volume>46</volume>
          <issue>4</issue>
          <fpage>1023</fpage>
          <lpage>31</lpage>
          <pub-id pub-id-type="doi">10.3758/s13428-013-0434-y</pub-id>
          <pub-id pub-id-type="medline">24356996</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Riess</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kraft-Todd</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>E.M.P.A.T.H.Y.: a tool to enhance nonverbal communication between clinicians and their patients</article-title>
          <source>Acad Med</source>
          <year>2014</year>
          <month>08</month>
          <volume>89</volume>
          <issue>8</issue>
          <fpage>1108</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.lww.com/24826853.pmid"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/ACM.0000000000000287</pub-id>
          <pub-id pub-id-type="medline">24826853</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Drukteinis</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>O'Keefe</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sanson</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Orban</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Preparing emergency physicians for malpractice litigation: a joint emergency medicine residency-law school mock trial competition</article-title>
          <source>J Emerg Med</source>
          <year>2014</year>
          <month>01</month>
          <volume>46</volume>
          <issue>1</issue>
          <fpage>95</fpage>
          <lpage>103</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jemermed.2013.08.017</pub-id>
          <pub-id pub-id-type="medline">24071029</pub-id>
          <pub-id pub-id-type="pii">S0736-4679(13)00903-7</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
