<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">ResProt</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Res Protoc</journal-id>
      <journal-title>JMIR Research Protocols</journal-title>
      <issn pub-type="epub">1929-0748</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v14i1e63887</article-id>
      <article-id pub-id-type="pmid">39913914</article-id>
      <article-id pub-id-type="doi">10.2196/63887</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Protocol</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Protocol</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>ChatGPT-4 Performance on German Continuing Medical Education—Friend or Foe (Trick or Treat)? Protocol for a Randomized Controlled Trial</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Schwartz</surname>
            <given-names>Amy</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hang</surname>
            <given-names>Ching Nam</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Liu</surname>
            <given-names>Xu</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>McGowan</surname>
            <given-names>Brian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Burisch</surname>
            <given-names>Christian</given-names>
          </name>
          <degrees>Dr rer nat</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>State of North Rhine-Westphalia</institution>
            <institution>Regional Government Düsseldorf</institution>
            <institution>Leibniz-Gymnasium</institution>
            <addr-line>Stankeitstraße 22</addr-line>
            <addr-line>Essen, 45326</addr-line>
            <country>Germany</country>
            <fax>49 201 79938722</fax>
            <phone>49 201 79938720</phone>
            <email>christian.burisch@rub.de</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-9710-7827</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Bellary</surname>
            <given-names>Abhav</given-names>
          </name>
          <degrees>Cand med</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0004-8349-3468</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Breuckmann</surname>
            <given-names>Frank</given-names>
          </name>
          <degrees>Prof Dr med</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7245-8000</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Ehlers</surname>
            <given-names>Jan</given-names>
          </name>
          <degrees>Prof Dr med vet</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6306-4173</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Thal</surname>
            <given-names>Serge C</given-names>
          </name>
          <degrees>Prof Dr med</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1222-8729</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Sellmann</surname>
            <given-names>Timur</given-names>
          </name>
          <degrees>Dr med</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1471-6806</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Gödde</surname>
            <given-names>Daniel</given-names>
          </name>
          <degrees>Dr med</degrees>
          <xref rid="aff9" ref-type="aff">9</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8430-1411</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>State of North Rhine-Westphalia</institution>
        <institution>Regional Government Düsseldorf</institution>
        <institution>Leibniz-Gymnasium</institution>
        <addr-line>Essen</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Didactics and Education Research in the Health Sector</institution>
        <institution>Faculty of Health</institution>
        <institution>Witten/Herdecke University</institution>
        <addr-line>Witten</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Faculty of Health</institution>
        <institution>Witten/Herdecke University</institution>
        <addr-line>Witten</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Cardiology, Pneumology, Neurology and Intensive Care Medicine</institution>
        <institution>Klinik Kitzinger Land</institution>
        <addr-line>Kitzingen</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Cardiology and Vascular Medicine</institution>
        <institution>West German Heart and Vascular Center Essen</institution>
        <institution>University Duisburg-Essen</institution>
        <addr-line>Essen</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department of Anesthesiology</institution>
        <institution>HELIOS University Hospital</institution>
        <addr-line>Wuppertal</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Department of Anaesthesiology I</institution>
        <institution>Witten/Herdecke University</institution>
        <addr-line>Witten</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>Department of Anesthesiology and Intensive Care Medicine</institution>
        <institution>Evangelisches Krankenhaus Hospital, BETHESDA zu Duisburg</institution>
        <addr-line>Duisburg</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff9">
        <label>9</label>
        <institution>Department of Pathology and Molecular Pathology</institution>
        <institution>HELIOS University Hospital Wuppertal, University Witten/Herdecke</institution>
        <addr-line>Witten</addr-line>
        <country>Germany</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Christian Burisch <email>christian.burisch@rub.de</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>6</day>
        <month>2</month>
        <year>2025</year>
      </pub-date>
      <volume>14</volume>
      <elocation-id>e63887</elocation-id>
      <history>
        <date date-type="received">
          <day>2</day>
          <month>7</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>9</day>
          <month>10</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>2</day>
          <month>12</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>27</day>
          <month>12</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Christian Burisch, Abhav Bellary, Frank Breuckmann, Jan Ehlers, Serge C Thal, Timur Sellmann, Daniel Gödde. Originally published in JMIR Research Protocols (https://www.researchprotocols.org), 06.02.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on https://www.researchprotocols.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.researchprotocols.org/2025/1/e63887" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The increasing development and spread of artificial and assistive intelligence is opening up new areas of application not only in applied medicine but also in related fields such as continuing medical education (CME), which is part of the mandatory training program for medical doctors in Germany. This study aims to determine whether medical laypersons can successfully complete training courses designed specifically for physicians with the help of a large language model (LLM) such as ChatGPT-4. It further aims to qualitatively and quantitatively investigate the impact of using artificial intelligence (AI; specifically ChatGPT) on the acquisition of credit points in German postgraduate medical education.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>Using this approach, we wanted to test further possible applications of AI in the postgraduate medical education setting and obtain results for practical use. Depending on the results, the potential influence of LLMs such as ChatGPT-4 on CME will be discussed, for example, as part of a SWOT (strengths, weaknesses, opportunities, threats) analysis.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We designed a randomized controlled trial in which adult high school students attempt to solve CME tests across six medical specialties in a total of three study arms, with 18 CME training courses per study arm, under different interventional conditions with varying amounts of permitted use of ChatGPT-4. Sample size calculation was performed including guess probability (20% correct answers, SD=40%; confidence level of 1–α=.95/α=.05; test power of 1–β=.95; <italic>P</italic>&#60;.05). The study was registered at the Open Science Framework (OSF).</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>As of October 2024, the acquisition of data and students to participate in the trial is ongoing. Upon analysis of our acquired data, we predict our findings to be ready for publication as soon as early 2025.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We aim to prove that the advances in AI, especially LLMs such as ChatGPT-4, have considerable effects on medical laypersons’ ability to successfully pass CME tests. The implications that this holds for how the concept of continuing medical education requires reevaluation are yet to be contemplated.</p>
        </sec>
        <sec sec-type="trial registration">
          <title>Trial Registration</title>
          <p>OSF Registries 10.17605/OSF.IO/MZNUF; https://osf.io/mznuf</p>
        </sec>
        <sec sec-type="registered-report">
          <title>International Registered Report Identifier (IRRID)</title>
          <p>PRR1-10.2196/63887</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>ChatGPT</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>large language model</kwd>
        <kwd>postgraduate education</kwd>
        <kwd>continuing medical education</kwd>
        <kwd>self-assessment program</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>ChatGPT-4 is the latest development in the large language model (LLM) family from ChatGPT. It is said to be trained on more than one trillion parameters, making it one of the most advanced LLMs currently available for generating conversation-style responses to user input. The parameters are the numerical values that determine how a neural network processes input data and produces output data. They are learned from data during the training process, encoding the model’s knowledge and skills [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
      <p>Since its launch by OpenAI, the ChatGPT family has stimulated widespread conversation and momentum across different specialties in medicine, as demonstrated by more than 3300 publications related to ChatGPT (or Chat-GPT) indexed in PubMed as of mid-May 2024. Generally, LLMs enable humans to interact and discuss a broad range of topics with artificial intelligence (AI) chatbots. New features of ChatGPT-4 include the acceptance of images as input and the generation of captions, classifications, and analyses, which were not available in earlier versions. Compared to its predecessors, ChatGPT-4 is 82% less likely to respond to inappropriate content requests and 40% more likely to provide factual answers than GPT-3 in internal evaluations [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      <p>After ChatGPT’s success in passing the United States Medical Licensing Examination, where it performed at a level comparable to that of a third-year medical student [<xref ref-type="bibr" rid="ref3">3</xref>], these results have been largely confirmed across various medical specialties. Comparisons with different ChatGPT versions and other LLM providers, such as Google, support these findings [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. There are currently two reviews on this topic [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>], and recent data specific to Germany have been published [<xref ref-type="bibr" rid="ref16">16</xref>].</p>
      <p>In conclusion, there is now a range of data on the use of LLMs in undergraduate education and teaching but less on postgraduate education, such as continuing medical education (CME) [<xref ref-type="bibr" rid="ref17">17</xref>] or self-assessment programs [<xref ref-type="bibr" rid="ref4">4</xref>]. <xref ref-type="table" rid="table1">Table 1</xref> shows a selection of studies on this topic.</p>
      <p>In Germany, CME, which is mandatory for medical specialists, requires earning 250 training points over five years. These CME points can be acquired through further specialization, attending congresses and conferences, and studying medical literature with consecutive answers to specific questions in the text. This approach essentially “credits” the self-study time spent attentively reading a text and then answering questions.</p>
      <p>For this study, we decided to use ChatGPT-4 because of its extensive database and ability to enter texts directly. Additionally, the input and operation of ChatGPT are carried out by adult high school students without any prior medical training. This was to differentiate as clearly as possible whether and to what extent LLMs can offer support today. This study aims to provide further insight into whether AI, in the form of LLMs, can support various levels of medical education by correctly answering CME-relevant questions, allowing participants to generate CME credits independently of existing medical knowledge.</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Data on ChatGPT and postgraduate medical education (continuing medical education or self-assessment programs).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="100"/>
          <col width="60"/>
          <col width="110"/>
          <col width="200"/>
          <col width="260"/>
          <col width="270"/>
          <thead>
            <tr valign="top">
              <td>First author</td>
              <td>Year</td>
              <td>Study</td>
              <td>Comparator</td>
              <td>Major findings</td>
              <td>Conclusions</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Sherazi and Canes [<xref ref-type="bibr" rid="ref4">4</xref>]</td>
              <td>2023</td>
              <td>Comparative trial</td>
              <td>ChatGPT-3.5 versus ChatGPT-4</td>
              <td>GPT-4 scored significantly higher than GPT-3.5 on the AUA<sup>a</sup> SASP<sup>b</sup> examinations in overall performance, across all test years, and in various urology topic areas.</td>
              <td>Results suggest improvement in evolving AI<sup>c</sup> LLM<sup>d</sup> in answering clinical urology questions. Certain aspects of medical knowledge and clinical reasoning remain challenging for LLMs.</td>
            </tr>
            <tr valign="top">
              <td>Riedel et al [<xref ref-type="bibr" rid="ref16">16</xref>]</td>
              <td>2023</td>
              <td>Comparative trial</td>
              <td>Performance of ChatGPT on OB/GYN<sup>e</sup> course examinations versus questions from the German medical state licensing examinations</td>
              <td>ChatGPT demonstrated consistent and comparable performance across both datasets, providing correct responses at a rate comparable with that of medical students.</td>
              <td>ChatGPT has promise as a supplementary tool in medical education and clinical practice, providing efficient and personalized learning experiences and assistance for health care providers.</td>
            </tr>
            <tr valign="top">
              <td>Noda et al [<xref ref-type="bibr" rid="ref18">18</xref>]</td>
              <td>2024</td>
              <td>Comparative trial</td>
              <td>ChatGPT-3.5 versus ChatGPT-4 versus Bard (Gemini)</td>
              <td>GPT-3.5 and Bard performed similarly while being significantly surpassed by GPT-4. GPT-4’s performance was between third- and fourth-year nephrology residents.</td>
              <td>GPT-4 outperformed GPT-3.5 and Bard, meeting the Nephrology Board renewal standards in specific years, albeit marginally. The results highlight LLMs’ potential and limitations.</td>
            </tr>
            <tr valign="top">
              <td>Ali et al [<xref ref-type="bibr" rid="ref6">6</xref>]</td>
              <td>2023</td>
              <td>Comparative trial</td>
              <td>ChatGPT-3.5 versus ChatGPT-4 versus user average</td>
              <td>GPT-4 significantly outperformed question bank users and GPT-3.5. Increased word count and higher-order problem-solving were associated with lower accuracy for GPT-3.5 but not for GPT-4.</td>
              <td>LLMs achieved passing scores on a mock 500-question neurosurgical written board examination, with GPT-4 significantly outperforming ChatGPT.</td>
            </tr>
            <tr valign="top">
              <td>Watari et al [<xref ref-type="bibr" rid="ref13">13</xref>]</td>
              <td>2023</td>
              <td>Comparison study</td>
              <td>ChatGPT-4 versus Japanese residents’ performance on GM-ITE<sup>f</sup></td>
              <td>Of 137 GM-ITE questions in Japanese, GPT-4 scores were significantly higher than the mean scores of residents.</td>
              <td>GPT-4 demonstrated a tendency to score higher on difficult questions. However, GPT-4 scored comparatively lower on questions testing attitudes toward patients and professionalism requiring an understanding of context and communication.</td>
            </tr>
            <tr valign="top">
              <td>Guerra et al [<xref ref-type="bibr" rid="ref5">5</xref>]</td>
              <td>2023</td>
              <td>Comparative trial</td>
              <td>ChatGPT-4 versus ChatGPT, SANS<sup>g</sup> users, medical students, and neurosurgery residents</td>
              <td>GPT-4 outperformed ChatGPT, exceeding the performances of medical students, neurosurgery residents, and the national average of SANS users across all categories.</td>
              <td>GPT-4 significantly outperformed medical students, neurosurgery residents, and the national average of SANS users.</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup>AUA: American Urological Association.</p>
          </fn>
          <fn id="table1fn2">
            <p><sup>b</sup>SASP: self-assessment study program.</p>
          </fn>
          <fn id="table1fn3">
            <p><sup>c</sup>AI: artificial intelligence.</p>
          </fn>
          <fn id="table1fn4">
            <p><sup>d</sup>LLM: large language model.</p>
          </fn>
          <fn id="table1fn5">
            <p><sup>e</sup>OB/GYN: obstetrics and gynecology.</p>
          </fn>
          <fn id="table1fn6">
            <p><sup>f</sup>GM-ITE: General Medicine In-Training Examination.</p>
          </fn>
          <fn id="table1fn7">
            <p><sup>g</sup>SANS: self-assessment in neurosurgery examination.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>This is a randomized controlled trial that will be undertaken following the principles of the Declaration of Helsinki, after approval by the local Ethics Committee of Witten/Herdecke University (S-108/2024, date of approval May 15, 2024) and after registration in a study register (Open Science Framework). To obtain representative, comprehensive, and meaningful data, three large German publishing houses (Deutscher Ärzteverlag GmbH, Cologne; Georg Thieme Verlag KG, Stuttgart; and Springer Medizin Verlag, Heidelberg) that offer journals with CME will be evaluated for one volume each of already expired journals (ie, without the possibility of earning credit points) from the fields of internal medicine, surgery, gynecology, pediatrics, neurology, and anesthesiology. The CME tests provided by the publishing houses needed no further adaptation for utilization in the study.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>The study protocol, which was submitted to and accepted by the Ethics Committee of University Witten/Herdecke (S-108/2024, date of approval May 15, 2024), stated decisively that no monetary or other compensation was to occur. The participants’ information was depersonalized by not collecting any personal information to begin with, as it was deemed insignificant to the study’s results; participants enrolled entirely voluntarily. Furthermore, to participate in the study, the students were required to provide a signed informed consent form. All students were given the opportunity to voice concerns and questions and were informed about their ability to revoke their consent without having to provide a reason and without having to expect any repercussions.</p>
      </sec>
      <sec>
        <title>Study Participants</title>
        <p>To minimize any influence from prior medical knowledge on the results, adult high school students from North Rhine-Westphalia who are willing to participate will be randomized into three study arms. As high school students can be assumed to be devoid of relevant prior medical education, the choice to include this group as participants is based on its ability to represent the approximate level of medical knowledge of the general population. The inclusion and exclusion criteria are shown in <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>. It should be emphasized that it is not the high school students who are the participants of the study but the CME course tests to which the methods of the three study arms are applied. Careful consideration was given to the selection of the CME tests, which were screened for images of diseases that students might deem disturbing. Such CMEs were excluded. The students were encouraged to voice concerns if the contents of the CME tests resulted in uneasiness. Furthermore, ample opportunity was provided for discussing the students’ experiences if deemed necessary by the participants. All these measures aided in minimizing the potential psychological impact of participation in the study. The experience of the participants while attempting to solve the CME tests is not represented in the study’s results as it was deemed to exceed the scope of the study. The students’ proficiency in the German language was required in the hope of avoiding skewed results based on linguistic incomprehension of the provided literature. The students act purely as “tools,” preferably without any medical knowledge of their own.</p>
        <boxed-text id="box1" position="float">
          <title>Inclusion and exclusion criteria.</title>
          <p>
            <bold>Inclusion criteria</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Aged 18 years or older</p>
            </list-item>
            <list-item>
              <p>Voluntary participation</p>
            </list-item>
            <list-item>
              <p>No financial compensation</p>
            </list-item>
            <list-item>
              <p>German as a native language or at a native speaker level</p>
            </list-item>
            <list-item>
              <p>Ability to operate ChatGPT or other required software</p>
            </list-item>
          </list>
          <p>
            <bold>Exclusion criteria</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Being underage</p>
            </list-item>
            <list-item>
              <p>Refusal to participate</p>
            </list-item>
            <list-item>
              <p>Insufficient German language skills</p>
            </list-item>
            <list-item>
              <p>Inability to operate ChatGPT or other required software</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Interventions</title>
        <p>This trial is designed as a three-armed randomized controlled trial, including one control arm.</p>
        <sec>
          <title>Intervention Group 1: “All-In”</title>
          <p>In this group, CME-subject-specific text is entered into ChatGPT-4 first, and then, the questions are answered by ChatGPT based on that input.</p>
        </sec>
        <sec>
          <title>Intervention Group 2: “Just Answers”</title>
          <p>In this group, questions are answered using only the knowledge available in the ChatGPT-4 database at that time, without entering any subject-specific text first.</p>
        </sec>
        <sec>
          <title>Control Group 3: “Search and Find”</title>
          <p>Participants in this group were asked to answer the questions using only keywords and common sense without any AI support. As the CME tests were viewed as digital files, use of the “find in text” function of the respective document viewing software was permitted.</p>
          <p>The approach to having the CME test questions answered in three study arms aims to uncover significant differences in ChatGPT-4’s ability to solve the CME tests, as well as assess the varying time required in the individual study arms.</p>
        </sec>
      </sec>
      <sec>
        <title>Data Analysis</title>
        <p>Sample size calculation was performed for the hypothesis that CME test results will improve from guess probability (20% correct answers, SD=40%) to pass level (70% correct answers) with a confidence level of 1–α=.95, that is, α=.05, and a test power of 1–β=.95. Therefore, for an independent-samples, two-sided study, a sample size of at least 18 CME training courses per study arm is needed. Nonetheless, since the CME courses, as our study subjects, can be processed repeatedly using different methods without altering them or the methods, a paired-sample study is possible and preferable. This allows the same CME courses to be used in the three study arms. Although a sample size of 9 for a single-sided paired-sample study would be sufficient (only an improvement in CME test results is expected and desired by applying the study arm methods), we decided to take a conservative route and will work with 18 CME tests that will be run through all three study arms. The CME tests treated were randomly chosen from a large number of available tests. Care was taken to ensure that every high school student completed the same number of tests in each arm of the study so that confounding variables in the students were evenly distributed across the three groups. In addition, none of them would work on a single CME test twice using different methods to avoid learning effects. Together with the reuse of the CME tests in the three study arms (paired study, see above), these measures prevent any bias arising from the high school students as performing tools or the CME tests themselves as study participants. The AI-supported arms would run through within the shortest possible time and in the correct order so that unwanted training of the AI or the students during the process could be ruled out as much as possible. Statistical data analysis will be performed using the open-source software “R” (R Core Team; 2023). The data will be presented as mean ± SD. Since the aim of the study is to identify differences in the percentage test results due to the different approaches in the three study arms, the Student <italic>t</italic> test (1-tailed) or the Mann-Whitney <italic>U</italic> test will be used for the pairwise comparison of means between groups, depending on the normality of the datasets. The Shapiro-Wilk test will be used to check normality. Fisher’s exact test will be used to assess the independence of categorical variables. Benjamini-Hochberg adjustments of <italic>P</italic> values will be applied in multiple comparisons. Values of <italic>P</italic>&#60;.05 will be considered statistically significant.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>As of October 2024, we have tested five out of the six students we deemed necessary to examine the 18 CME tests across the three study arms. We are set to terminate the data acquisition by November 2024. The ensuing data analysis is predicted to end in December 2024, enabling us to present our results in early 2025.</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>To present the influence of AI as objectively as possible, we deliberately refrained from using medically trained test participants. This allows us to identify the pure influence of AI. Depending on the degree of success, it will be necessary to determine to what extent AI can be permissible in CME training courses and what conditions or protective measures are to be imposed.</p>
        <p>Since its launch in 2023, not only the development of ChatGPT but also its integration into the medical context have increased rapidly, as shown by the ever more extensive database versions and the steadily growing number of medical publications [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref23">23</xref>]. However, as the capabilities of AI increase, so does the responsibility of actual intelligence to use it in the best possible way for the benefit of all without causing harm (“primum nihil nocere”). Even if the use of AI to solve examinations, whether student or specialist examinations, has already been investigated several times, there is still a knowledge gap in postgraduate teaching and its effects. Ethical, social, and, above all, legal aspects also need to be clarified.</p>
        <p>AI has the potential to revolutionize various aspects of our lives. In medicine, its strength lies in its wide range of possible applications. However, the use of AI in education, training, and specialization must be clearly labeled, as it presents not only opportunities but also weaknesses and threats, particularly with the use of LLMs such as ChatGPT and related programs [<xref ref-type="bibr" rid="ref1">1</xref>]. The correct use of AI in postgraduate medical education, especially LLMs, still needs to be explored and discussed.</p>
        <p>This study aims to show that medical training tests can be successfully completed by medical laypersons using AI, which raises questions about the continued usefulness of current training programs, potential regulations to prevent misuse, and opportunities to harness AI capabilities in this context. Currently, self-study to obtain CME credits is an integral part of German postgraduate medical education. This study’s results may have the potential to influence this practice significantly.</p>
        <p>The decision to examine ChatGPT’s results in three study arms was based on the hope of being able to compare the results obtained while gaining insight into whether the literature backgrounds of the CME were required to generate significantly superior results.</p>
        <p>The rationale behind the choice of medical specialties whose CME tests were analyzed in the study results from ChatGPT-4’s ability to merely process text. None of the medical specialties we chose to include predominantly diagnoses based on visual symptoms. However, a new investigation on newer ChatGPT versions, which possess the ability to obtain information from images, is underway.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study has several limitations. First, only German CMEs are evaluated. Second, only a minority of specialties were chosen. Finally, we completely dispensed with CME with image content, as is usual in radiology, dermatology, or pathology, for example, to avoid changing the selectivity.</p>
        <p>How potential biases that result from the data that was used in training the AI tools impacted the results of the study is not derivable, as ChatGPT does not possess knowledge in the classical sense. It is rather the case that lexical data is produced based on prior training.</p>
        <p>Whether knowledge acquired through AI-generated literature is retained differently than conventionally attained medical knowledge is yet to be assessed in future research.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The impact on current and future CME programs should be considered as the certified means of personalizing one’s medical education remains scarce. AI could play a role in tailoring continuous education to personalized needs and, for example, adapting the modules based on prior results to target potential individual shortcomings. The role AI could play in medical education provided by university faculties, as well as personalized learning programs, surely merits further investigation [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>].</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CME</term>
          <def>
            <p>continuing medical education</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research received no external funding.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The datasets generated during or analyzed during this study are not yet publicly available as they are yet to be analyzed but can be made available from the corresponding author upon reasonable request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>The conceptualization was a result of cooperation by TS, DG, AB, and CB; the formal analysis was performed by CB, AB, DG, and TS; funding acquisition was accomplished by DG; our methodology was developed by TS, FB, and JE; project administration was supervised by TS and DG; the original draft was written by CB and AB, and it was then rewritten, edited, and reviewed by TS, JE, CB, AB, FB, SCT, and DG. All authors have read and agreed to the published version of the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gödde</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nöhl</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rupert</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rimkus</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ehlers</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Breuckmann</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sellmann</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>A SWOT (strengths, weaknesses, opportunities, and threats) analysis of ChatGPT in the medical literature: concise review</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <volume>25</volume>
          <fpage>e49368</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023/1/e49368/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/49368</pub-id>
          <pub-id pub-id-type="medline">37865883</pub-id>
          <pub-id pub-id-type="pii">v25i1e49368</pub-id>
          <pub-id pub-id-type="pmcid">PMC10690535</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <source>ChatGPT-4</source>
          <access-date>2024-05-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://chatgpt.ch/gpt-4/">https://chatgpt.ch/gpt-4/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gilson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Safranek</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Socrates</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Chartash</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>How does ChatGPT perform on the United States Medical Licensing Examination (USMLE)? The implications of large language models for medical education and knowledge assessment</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>e45312</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e45312/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/45312</pub-id>
          <pub-id pub-id-type="medline">36753318</pub-id>
          <pub-id pub-id-type="pii">v9i1e45312</pub-id>
          <pub-id pub-id-type="pmcid">PMC9947764</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sherazi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Canes</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Comprehensive analysis of the performance of GPT-3.5 and GPT-4 on the American Urological Association self-assessment study program exams from 2012-2023</article-title>
          <source>Can Urol Assoc J</source>
          <year>2023</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.5489/cuaj.8526"/>
          </comment>
          <pub-id pub-id-type="doi">10.5489/cuaj.8526</pub-id>
          <pub-id pub-id-type="medline">38381942</pub-id>
          <pub-id pub-id-type="pii">cuaj.8526</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guerra</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Hofmann</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sobhani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hofmann</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gomez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Soroudi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hopkins</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Dallas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pangal</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cheok</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>VN</given-names>
            </name>
            <name name-style="western">
              <surname>Mack</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zada</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>GPT-4 artificial intelligence model outperforms ChatGPT, medical students, and neurosurgery residents on neurosurgery written board-like questions</article-title>
          <source>World Neurosurg</source>
          <year>2023</year>
          <volume>179</volume>
          <fpage>e160</fpage>
          <lpage>e165</lpage>
          <pub-id pub-id-type="doi">10.1016/j.wneu.2023.08.042</pub-id>
          <pub-id pub-id-type="medline">37597659</pub-id>
          <pub-id pub-id-type="pii">S1878-8750(23)01144-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>OY</given-names>
            </name>
            <name name-style="western">
              <surname>Connolly</surname>
              <given-names>ID</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>PLZ</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Fridley</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Asaad</surname>
              <given-names>WF</given-names>
            </name>
            <name name-style="western">
              <surname>Cielo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oyelese</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Doberstein</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Gokaslan</surname>
              <given-names>ZL</given-names>
            </name>
            <name name-style="western">
              <surname>Telfeian</surname>
              <given-names>AE</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT and GPT-4 on neurosurgery written board examinations</article-title>
          <source>Neurosurgery</source>
          <year>2023</year>
          <volume>93</volume>
          <issue>6</issue>
          <fpage>1353</fpage>
          <lpage>1365</lpage>
          <pub-id pub-id-type="doi">10.1227/neu.0000000000002632</pub-id>
          <pub-id pub-id-type="medline">37581444</pub-id>
          <pub-id pub-id-type="pii">00006123-202312000-00018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>OY</given-names>
            </name>
            <name name-style="western">
              <surname>Connolly</surname>
              <given-names>ID</given-names>
            </name>
            <name name-style="western">
              <surname>Fridley</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>PLZ</given-names>
            </name>
            <name name-style="western">
              <surname>Cielo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oyelese</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Doberstein</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Telfeian</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Gokaslan</surname>
              <given-names>ZL</given-names>
            </name>
            <name name-style="western">
              <surname>Asaad</surname>
              <given-names>WF</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT, GPT-4, and Google bard on a neurosurgery oral boards preparation question bank</article-title>
          <source>Neurosurgery</source>
          <year>2023</year>
          <volume>93</volume>
          <issue>5</issue>
          <fpage>1090</fpage>
          <lpage>1098</lpage>
          <pub-id pub-id-type="doi">10.1227/neu.0000000000002551</pub-id>
          <pub-id pub-id-type="medline">37306460</pub-id>
          <pub-id pub-id-type="pii">00006123-990000000-00775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Yunus</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sohail</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rehman</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Saeed</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Sharkey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mahmood</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Matyal</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence for anesthesiology board-style examination questions: role of large language models</article-title>
          <source>J Cardiothorac Vasc Anesth</source>
          <year>2024</year>
          <volume>38</volume>
          <issue>5</issue>
          <fpage>1251</fpage>
          <lpage>1259</lpage>
          <pub-id pub-id-type="doi">10.1053/j.jvca.2024.01.032</pub-id>
          <pub-id pub-id-type="medline">38423884</pub-id>
          <pub-id pub-id-type="pii">S1053-0770(24)00090-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hofmann</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Guerra</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Hofmann</surname>
              <given-names>GH</given-names>
            </name>
            <name name-style="western">
              <surname>Mayfield</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Petrigliano</surname>
              <given-names>FA</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>JN</given-names>
            </name>
          </person-group>
          <article-title>The rapid development of artificial intelligence: GPT-4's performance on orthopedic surgery board questions</article-title>
          <source>Orthopedics</source>
          <year>2024</year>
          <volume>47</volume>
          <issue>2</issue>
          <fpage>e85</fpage>
          <lpage>e89</lpage>
          <pub-id pub-id-type="doi">10.3928/01477447-20230922-05</pub-id>
          <pub-id pub-id-type="medline">37757748</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lum</surname>
              <given-names>ZC</given-names>
            </name>
          </person-group>
          <article-title>Can artificial intelligence pass the American Board of Orthopaedic Surgery Examination? Orthopaedic residents versus ChatGPT</article-title>
          <source>Clin Orthop Relat Res</source>
          <year>2023</year>
          <volume>481</volume>
          <issue>8</issue>
          <fpage>1623</fpage>
          <lpage>1630</lpage>
          <pub-id pub-id-type="doi">10.1097/CORR.0000000000002704</pub-id>
          <pub-id pub-id-type="medline">37220190</pub-id>
          <pub-id pub-id-type="pii">00003086-990000000-01207</pub-id>
          <pub-id pub-id-type="pmcid">PMC10344569</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Massey</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Montgomery</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>Comparison of ChatGPT-3.5, ChatGPT-4, and orthopaedic resident performance on orthopaedic assessment examinations</article-title>
          <source>J Am Acad Orthop Surg</source>
          <year>2023</year>
          <volume>31</volume>
          <issue>23</issue>
          <fpage>1173</fpage>
          <lpage>1179</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37671415"/>
          </comment>
          <pub-id pub-id-type="doi">10.5435/JAAOS-D-23-00396</pub-id>
          <pub-id pub-id-type="medline">37671415</pub-id>
          <pub-id pub-id-type="pii">00124635-990000000-00782</pub-id>
          <pub-id pub-id-type="pmcid">PMC10627532</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ling</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Abudukeremu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on the Chinese postgraduate examination for clinical medicine: survey study</article-title>
          <source>JMIR Med Educ</source>
          <year>2024</year>
          <volume>10</volume>
          <fpage>e48514</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e48514/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48514</pub-id>
          <pub-id pub-id-type="medline">38335017</pub-id>
          <pub-id pub-id-type="pii">v10i1e48514</pub-id>
          <pub-id pub-id-type="pmcid">PMC10891494</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Watari</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Takagi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sakaguchi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nishizaki</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shimizu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yamamoto</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tokuda</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Performance comparison of ChatGPT-4 and Japanese medical residents in the general medicine in-training examination: comparison study</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>e52202</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e52202/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/52202</pub-id>
          <pub-id pub-id-type="medline">38055323</pub-id>
          <pub-id pub-id-type="pii">v9i1e52202</pub-id>
          <pub-id pub-id-type="pmcid">PMC10733815</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sumbal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sumbal</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Amir</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Can ChatGPT-3.5 pass a medical exam? A systematic review of ChatGPT's performance in academic testing</article-title>
          <source>J Med Educ Curric Dev</source>
          <year>2024</year>
          <volume>11</volume>
          <fpage>23821205241238641</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/23821205241238641?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/23821205241238641</pub-id>
          <pub-id pub-id-type="medline">38487300</pub-id>
          <pub-id pub-id-type="pii">10.1177_23821205241238641</pub-id>
          <pub-id pub-id-type="pmcid">PMC10938614</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>TW</given-names>
            </name>
          </person-group>
          <article-title>Application of artificial intelligence chatbots, including ChatGPT, in education, scholarly work, programming, and content generation and its prospects: a narrative review</article-title>
          <source>J Educ Eval Health Prof</source>
          <year>2023</year>
          <volume>20</volume>
          <fpage>38</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.3352/jeehp.2023.20.38"/>
          </comment>
          <pub-id pub-id-type="doi">10.3352/jeehp.2023.20.38</pub-id>
          <pub-id pub-id-type="medline">38148495</pub-id>
          <pub-id pub-id-type="pii">jeehp.2023.20.38</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Riedel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kaefinger</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Stuehrenberg</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ritter</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Amann</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Graf</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Recker</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kiechle</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Riedel</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT's performance in German OB/GYN exams—paving the way for AI-enhanced medical education and clinical practice</article-title>
          <source>Front Med (Lausanne)</source>
          <year>2023</year>
          <volume>10</volume>
          <fpage>1296615</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38155661"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fmed.2023.1296615</pub-id>
          <pub-id pub-id-type="medline">38155661</pub-id>
          <pub-id pub-id-type="pmcid">PMC10753765</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Seetharaman</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Revolutionizing medical education: can ChatGPT boost subjective learning and expression?</article-title>
          <source>J Med Syst</source>
          <year>2023</year>
          <volume>47</volume>
          <issue>1</issue>
          <fpage>61</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-023-01957-w</pub-id>
          <pub-id pub-id-type="medline">37160568</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-023-01957-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Noda</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Izaki</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kitano</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Komatsu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ichikawa</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Shibagaki</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT and Bard in self-assessment questions for nephrology board renewal</article-title>
          <source>Clin Exp Nephrol</source>
          <year>2024</year>
          <volume>28</volume>
          <issue>5</issue>
          <fpage>465</fpage>
          <lpage>469</lpage>
          <pub-id pub-id-type="doi">10.1007/s10157-023-02451-w</pub-id>
          <pub-id pub-id-type="medline">38353783</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10157-023-02451-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Flores-Cohaila</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>García-Vicente</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vizcarra-Jiménez</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>De la Cruz-Galán</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Gutiérrez-Arratia</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Torres</surname>
              <given-names>BGQ</given-names>
            </name>
            <name name-style="western">
              <surname>Taype-Rondan</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on the Peruvian national licensing medical examination: cross-sectional study</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>e48039</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e48039/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48039</pub-id>
          <pub-id pub-id-type="medline">37768724</pub-id>
          <pub-id pub-id-type="pii">v9i1e48039</pub-id>
          <pub-id pub-id-type="pmcid">PMC10570896</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meo</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Alotaibi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meo</surname>
              <given-names>MZS</given-names>
            </name>
            <name name-style="western">
              <surname>Meo</surname>
              <given-names>MOS</given-names>
            </name>
            <name name-style="western">
              <surname>Hamid</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Medical knowledge of ChatGPT in public health, infectious diseases, COVID-19 pandemic, and vaccines: multiple choice questions examination based performance</article-title>
          <source>Front Public Health</source>
          <year>2024</year>
          <volume>12</volume>
          <fpage>1360597</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38711764"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpubh.2024.1360597</pub-id>
          <pub-id pub-id-type="medline">38711764</pub-id>
          <pub-id pub-id-type="pmcid">PMC11073538</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meo</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Masri</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Alotaibi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meo</surname>
              <given-names>MZS</given-names>
            </name>
            <name name-style="western">
              <surname>Meo</surname>
              <given-names>MOS</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT knowledge evaluation in basic and clinical medical sciences: multiple choice question examination-based performance</article-title>
          <source>Healthcare (Basel)</source>
          <year>2023</year>
          <volume>11</volume>
          <issue>14</issue>
          <fpage>2046</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=healthcare11142046"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/healthcare11142046</pub-id>
          <pub-id pub-id-type="medline">37510487</pub-id>
          <pub-id pub-id-type="pii">healthcare11142046</pub-id>
          <pub-id pub-id-type="pmcid">PMC10379728</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghosh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jindal</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>VK</given-names>
            </name>
            <name name-style="western">
              <surname>Bansal</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bajwa</surname>
              <given-names>NK</given-names>
            </name>
            <name name-style="western">
              <surname>Sett</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Is ChatGPT's knowledge and interpretative ability comparable to first professional MBBS (Bachelor of Medicine, Bachelor of Surgery) students of India in taking a medical biochemistry examination?</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <volume>15</volume>
          <issue>10</issue>
          <fpage>e47329</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38021639"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.47329</pub-id>
          <pub-id pub-id-type="medline">38021639</pub-id>
          <pub-id pub-id-type="pmcid">PMC10657167</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <article-title>R: a language and environment for statistical computing</article-title>
          <source>R Foundation for Statistical Computing</source>
          <access-date>2024-05-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.R-project.org">https://www.R-project.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vandirk</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Urbach</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gimpel</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Decker</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Eymann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lämmermann</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mädche</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Röglinger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ruiner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schoch</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schoop</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Unlocking the power of generative AI models and systems such as GPT-4 and ChatGPT for higher education: a guide for students and lecturers</article-title>
          <source>Hohenheim Discussion Papers in Business, Economics and Social Sciences, No. 02-2023, Universität Hohenheim, Fakultät Wirtschafts- und Sozialwissenschaften, Stuttgart</source>
          <year>2023</year>
          <access-date>2025-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://nbn-resolving.de/urn:nbn:de:bsz:100-opus-21463">https://nbn-resolving.de/urn:nbn:de:bsz:100-opus-21463</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hang</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>MCQGen: a large language model-driven MCQ generator for personalized learning</article-title>
          <source>IEEE Access</source>
          <year>2024</year>
          <volume>12</volume>
          <fpage>102261</fpage>
          <lpage>102273</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2024.3420709</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fuchs</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Exploring the opportunities and challenges of NLP models in higher education: is Chat GPT a blessing or a curse?</article-title>
          <source>Front Educ</source>
          <year>2023</year>
          <volume>8</volume>
          <fpage>1166682</fpage>
          <pub-id pub-id-type="doi">10.3389/feduc.2023.1166682</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
