<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Res Protoc</journal-id><journal-id journal-id-type="publisher-id">ResProt</journal-id><journal-id journal-id-type="index">5</journal-id><journal-title>JMIR Research Protocols</journal-title><abbrev-journal-title>JMIR Res Protoc</abbrev-journal-title><issn pub-type="epub">1929-0748</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v14i1e76776</article-id><article-id pub-id-type="doi">10.2196/76776</article-id><article-categories><subj-group subj-group-type="heading"><subject>Protocol</subject></subj-group></article-categories><title-group><article-title>Improving the Reporting Quality of Studies on Information Extraction From Clinical Texts: Protocol for the Development of a Consensus-Based Reporting Guideline</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Reichenpfader</surname><given-names>Daniel</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>M&#x00FC;ller</surname><given-names>Henning</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Denecke</surname><given-names>Kerstin</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Institute for Patient-Centered Digital Health, Department of Engineering and Computer Science, Bern University of Applied Sciences</institution><addr-line>Quellgasse 21</addr-line><addr-line>Biel</addr-line><country>Switzerland</country></aff><aff id="aff2"><institution>PhD School of Life Sciences, Faculty of Medicine, University of Geneva</institution><addr-line>Geneva</addr-line><country>Switzerland</country></aff><aff id="aff3"><institution>Department of Radiology and Medical Informatics, University of Geneva</institution><addr-line>Geneva</addr-line><country>Switzerland</country></aff><aff id="aff4"><institution>Informatics Institute, HES-SO Valais-Wallis</institution><addr-line>Sierre</addr-line><country>Switzerland</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Sarvestan</surname><given-names>Javad</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Zheng</surname><given-names>Jiaping</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Blazey</surname><given-names>Paul</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Daniel Reichenpfader, MSc, Institute for Patient-Centered Digital Health, Department of Engineering and Computer Science, Bern University of Applied Sciences, Quellgasse 21, Biel, 2502, Switzerland, 41 31 848 60 93; <email>daniel.reichenpfader@bfh.ch</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>24</day><month>9</month><year>2025</year></pub-date><volume>14</volume><elocation-id>e76776</elocation-id><history><date date-type="received"><day>30</day><month>04</month><year>2025</year></date><date date-type="rev-recd"><day>10</day><month>09</month><year>2025</year></date><date date-type="accepted"><day>15</day><month>09</month><year>2025</year></date></history><copyright-statement>&#x00A9; Daniel Reichenpfader, Henning M&#x00FC;ller, Kerstin Denecke. Originally published in JMIR Research Protocols (<ext-link ext-link-type="uri" xlink:href="https://www.researchprotocols.org">https://www.researchprotocols.org</ext-link>), 24.9.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.researchprotocols.org">https://www.researchprotocols.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.researchprotocols.org/2025/1/e76776"/><abstract><sec><title>Background</title><p>Information extraction (IE) from clinical texts is increasingly important in health care; yet, reporting practices remain inconsistent. Existing guidelines do not fully address the unique challenges of IE studies. IE methods vary widely in their design, ranging from rule-based systems to advanced large language models, contributing to heterogeneity in reporting. While several reporting frameworks exist for applications of artificial intelligence in health care, they primarily focus on prediction modeling or clinical trials and associated protocols rather than text-based IE.</p></sec><sec><title>Objective</title><p>This study aims to develop the Clinical Information Extraction (CINEX) guideline, a consensus-based reporting guideline for studies on clinical IE.</p></sec><sec sec-type="methods"><title>Methods</title><p>The CINEX guideline is developed following an established guideline methodology, including a 3-round electronic Delphi (eDelphi) study with domain experts and a final in-person consensus meeting. The eDelphi process includes feedback loops and predefined consensus thresholds, with items rated on a 10-point scale for both relevance and maturity. The final consensus meeting is held as a hybrid workshop at the MEDINFO 2025 conference and focuses on finalizing the items that reached consensus.</p></sec><sec sec-type="results"><title>Results</title><p>Our results will provide a validated reporting guideline for studies on clinical IE. A preliminary set of 28 reporting items was drafted from a scoping review and existing frameworks. The draft guidelines include 5 key dimensions: information model, architecture, data, annotation, and outcome. This draft guideline will be refined through the eDelphi process. It is designed to be technology-agnostic and applicable across diverse IE approaches, including not only large language models but also traditional machine learning methods and rule-based and hybrid systems.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The CINEX guideline provides structured, expert-validated guidance for reporting clinical IE studies, improving transparency, reproducibility, and comparability. The final guideline will be disseminated alongside an explanatory document to support adoption and implementation.</p></sec><sec sec-type="registered-report"><title>International Registered Report Identifier (IRRID)</title><p>PRR1-10.2196/76776</p></sec></abstract><kwd-group><kwd>reporting guideline</kwd><kwd>information extraction</kwd><kwd>artificial intelligence</kwd><kwd>natural language processing</kwd><kwd>consensus-based approach</kwd><kwd>eDelphi study</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Information extraction (IE) refers to techniques that automatically identify and structure key information from unstructured text. These methods enable efficient reuse of clinical narratives, supporting decision-making, research, and automation in electronic health records. Specific use cases include phenotyping (eg, extraction of specific diseases), drug-related tasks (eg, dosage IE), and clinical workflow optimization (eg, adverse event detection) [<xref ref-type="bibr" rid="ref1">1</xref>]. Furthermore, IE can reduce the burden of manual chart review, enable large-scale epidemiological studies, and support real-time decision support.</p><p>Recent advances in natural language processing (NLP), especially through large language models (LLMs), have improved IE capabilities. However, this rapid technical evolution has introduced fragmentation in methods, terminology, and evaluation. We identified this heterogeneity during a scoping review of studies describing IE specifically from radiology reports. Studies vary widely in defining the target information, annotating reference standards, evaluating system performance, and disclosing implementation details [<xref ref-type="bibr" rid="ref2">2</xref>]. Without standardized reporting, it becomes difficult to interpret results, compare systems, replicate experiments, or translate the developed effective algorithms into clinical practice. This suboptimal reporting quality had already been identified in a systematic review conducted by Davidson et al [<xref ref-type="bibr" rid="ref3">3</xref>] in 2021.</p><p>To address reporting variability in artificial intelligence (AI) studies, several guidelines have emerged. The CONSORT-AI (Consolidated Standards of Reporting Trials&#x2013;Artificial Intelligence) extension provides a checklist for reporting clinical trials that include AI-based interventions [<xref ref-type="bibr" rid="ref4">4</xref>]. Its counterpart, SPIRIT-AI (Standard Protocol Items: Recommendations for Interventional Trials&#x2013;Artificial Intelligence), focuses on protocol reporting for such trials, ensuring clarity and completeness before trial execution [<xref ref-type="bibr" rid="ref5">5</xref>]. More recently, TRIPOD+AI (Transparent Reporting of a multivariable prediction model for Individual Prognosis Or Diagnosis&#x2013;Artificial Intelligence) [<xref ref-type="bibr" rid="ref6">6</xref>] and TRIPOD-LLM (Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis Or Diagnosis specifically tailored for large language models) [<xref ref-type="bibr" rid="ref7">7</xref>] have extended the original TRIPOD (Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis Or Diagnosis) [<xref ref-type="bibr" rid="ref8">8</xref>] guidelines to include the application of regression and machine learning methods as well as LLM-based approaches for prediction model studies. These guidelines promote transparency and reproducibility for studies describing AI-based interventions and prediction models. However, none are applicable to the reporting needs of IE from clinical text, which involves distinct tasks, input-output structures, and evaluation methods as compared to diagnostic modeling or intervention and their associated trials.</p><p>This paper presents the protocol for the development of the Clinical Information Extraction (CINEX) guideline, a consensus-based reporting guideline for clinical IE studies. This protocol outlines the methodology behind the CINEX guideline, including a 3-round modified electronic Delphi (eDelphi) process with domain experts. The development of this guideline follows best practices for health research reporting and includes steps for item refinement, a final in-person consensus meeting, and the publication of an explanation and elaboration (E&#x0026;E) document. The CINEX guideline aims to close the reporting gap in clinical IE research, promoting rigor, transparency, and harmonization across diverse methodological paradigms.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview and Preliminary Guideline Development</title><p>The planned development process of the CINEX guideline was registered and publicly listed with the EQUATOR (Enhancing the Quality and Transparency Of Health Research) Network as a reporting guideline under development in August 2024 prior to its official start in October 2024 [<xref ref-type="bibr" rid="ref9">9</xref>]. The EQUATOR Network is an international initiative that promotes transparent and accurate reporting of health research to improve the reliability and value of the published literature [<xref ref-type="bibr" rid="ref10">10</xref>]. The CINEX guideline follows the methodological guidance outlined by Moher et al [<xref ref-type="bibr" rid="ref11">11</xref>] for developing health research reporting guidelines. Throughout this protocol, references to Moher&#x2019;s checklist items are indicated in angle brackets (&#x003C; &#x003E;).</p><p>The need for this guideline was identified during a scoping review of studies on LLM-based IE from radiology reports &#x003C;1&#x003E; [<xref ref-type="bibr" rid="ref2">2</xref>]. The review aimed to assess the current state of the art in terms of performance, training and modeling approaches, clinical use cases, datasets, annotation methods, and commonly reported challenges. Derived from the review&#x2019;s aims, a data extraction table was drafted and populated by one author. The scoping review revealed important barriers to study comparability, including untransparent performance metric calculations, lack of external validation, and limited availability of source code. These problems hinder transparency and reproducibility in the field. Based on the data extraction table as well as inspired by existing reporting guidelines, an initial set of 28 candidate reporting items was drafted and published &#x003C;2&#x003E; [<xref ref-type="bibr" rid="ref12">12</xref>].</p></sec><sec id="s2-2"><title>eDelphi Study</title><p>To refine the preliminary guideline, a 3-round eDelphi study was planned between May and July 2025 &#x003C;5,6&#x003E;. The Delphi method was chosen as a structured, iterative process to achieve expert consensus, in line with the recommendations of Moher et al [<xref ref-type="bibr" rid="ref11">11</xref>] for reporting guideline development.</p><p>We designed the eDelphi process based on the methodological principles of H&#x00E4;der [<xref ref-type="bibr" rid="ref13">13</xref>], Nasa et al [<xref ref-type="bibr" rid="ref14">14</xref>], as well as Trevelyan and Robinson [<xref ref-type="bibr" rid="ref15">15</xref>]. We aim to recruit between 20 and 30 participants &#x003C;4&#x003E;. Minimum response rates are set at 30% for the first round and 70% for the following rounds, consistent with H&#x00E4;der&#x2019;s [<xref ref-type="bibr" rid="ref13">13</xref>] guidance.</p><p>Eligible participants include the authors of studies identified in the preceding scoping review, as well as domain experts with regard to clinical IE, recruited through the personal and professional networks of the executive committee. Interested individuals will be invited via email to join the study. The survey itself will be conducted using the open-source tool LimeSurvey [<xref ref-type="bibr" rid="ref16">16</xref>].</p><p>The eDelphi study will comprise exactly 3 rounds [<xref ref-type="bibr" rid="ref13">13</xref>]. Consensus for the inclusion of an item in the guideline will be defined as a mean rating of 8 or higher on a 10-point scale, with an SD of 2 or less. Exclusion will be defined as a mean rating of 3 or lower, also with an SD of &#x2264;2. Items falling outside these thresholds will be revisited during a final consensus meeting held after the eDelphi process. Response stability is recorded but not used to assess early termination. Only in the first round, panelists have the possibility to add additional items for each domain. Exclusion as well as finalization due to consensus of items is only conducted after rounds 2 and 3. Rephrasing of items and descriptions is conducted after each round based on the panelists&#x2019; comments.</p><p>In the first round, participants will be presented with the draft reporting items, including any proposed value sets where applicable. They will be asked to assess the relevance and maturity of each item using a 10-point scale with labeled endpoints only (&#x201C;not at all relevant&#x201D; and &#x201C;not at all mature&#x201D; to &#x201C;very relevant&#x201D; and &#x201C;very mature&#x201D;). Each item additionally includes a default &#x201C;No answer&#x201D; option. To approximate interval-level data, a larger number of anchor points was selected instead of a classical 5-point scale based on methodological recommendations [<xref ref-type="bibr" rid="ref17">17</xref>]. To exclude or include (finalize) an item, the abovementioned mean and SD thresholds must be met for both relevance and maturity.</p><p>Feedback will be proactively provided by the executive committee for each new round (active feedback loop): participants re-evaluate items that were not excluded, assisted by aggregated ratings of the whole panel (as histograms), moderated anonymized comments from the previous round, and their own previous ratings. This format enables reflection and informed re-evaluation.</p><p>Besides participating in the eDelphi panel, each expert completes a self-disclosure of their expertise in clinical IE. Consistent with H&#x00E4;der [<xref ref-type="bibr" rid="ref13">13</xref>], no demographic data will be collected beyond gender and country of affiliation. Anonymity among participants will be preserved throughout the eDelphi panel. At the end of the first round, participants will be invited to indicate whether they wish to participate in the final consensus meeting taking place after the completion of the third round and to contribute to the final publication of the CINEX guideline and the explanatory document.</p><p>A pretest of the first-round survey will be conducted among the executive committee (comprising authors DR, HM, and KD) to ensure clarity and functionality. These individuals will not participate in the actual eDelphi rounds.</p></sec><sec id="s2-3"><title>Consensus Meeting, Finalization, and Outlook</title><p>For the final step of the guideline development process, a face-to-face hybrid consensus meeting is conducted, organized as a workshop at the MEDINFO conference in August 2025 &#x003C;6,7,8&#x003E;. During the workshop, the results of the Delphi process are presented, and items that achieved consensus are reviewed for resolving minor ambiguities and final phrasing. Items without prior agreement are discussed and, if needed, resolved by open voting. Consensus is defined as &#x2265;80% agreement. The meeting is considered quorate if &#x2265;50% of the panelists of the first round of the eDelphi panel are present. Persistent disagreements will be documented and reported transparently in the publication of the final guideline. The workshop shall result in the formal finalization of the CINEX guideline; thereafter, the guidance statement is finalized &#x003C;9&#x003E;, complemented by an E&#x0026;E document &#x003C;10&#x003E;, and both are made available as publication &#x003C;11&#x003E;. The guideline development process will be reported in a structured way in accordance with the Accurate Consensus Reporting Document (ACCORD) reporting guideline [<xref ref-type="bibr" rid="ref18">18</xref>].</p><p>Responsibilities for postpublication activities &#x003C;12&#x2010;18&#x003E; are divided among the contributing authors: the CINEX guideline will be hosted on an open access online platform for ongoing feedback &#x003C;12,14,16&#x003E;, will be pilot-tested by panelists, and its impact on reporting quality will be evaluated. To ensure durability, an executive group will review the CINEX guideline at regular 3-year intervals, evaluating its impact &#x003C;15&#x003E; and issuing updates when new evidence or methods make a revision necessary &#x003C;18&#x003E;. We seek endorsement from journals and societies &#x003C;13&#x003E;. Translation is not planned for the initial release &#x003C;17&#x003E;. By following these postpublication activities, we aim at establishing a long-term relevance of the CINEX guideline.</p></sec><sec id="s2-4"><title>Ethical Considerations</title><p>This study was granted an exemption by the competent ethics committee of the canton of Bern on April 29, 2025 (ID: Req-2025&#x2010;00587). All eDelphi study participants gave electronic informed consent prior to participation.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>A preliminary guideline comprising 28 items and 5 dimensions (information model, architecture, data, annotation, and outcome) was published in August 2024 [<xref ref-type="bibr" rid="ref12">12</xref>]. These items will be presented in the first round of the eDelphi study.</p></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Results</title><p>This protocol presents the development of the CINEX guideline, a reporting guideline specifically developed for clinical IE studies. The CINEX guideline addresses key challenges in the field&#x2014;including inconsistent terminology, reporting, and evaluation&#x2014;by providing a structured, technology-agnostic framework tailored to IE tasks in health care. By design, the CINEX guideline accommodates both rule-based and data-driven approaches, including LLM-based methods by focusing on essential reporting dimensions (eg, data sources, annotation strategies, information model, and evaluation metrics) that apply across paradigms. This ensures that differences in implementation, such as rule-based extraction pipelines or end-to-end architectures, can be transparently described and compared within a shared reporting structure. To facilitate adoption, we will pursue parallel endorsement of the CINEX guideline by multiple journals in biomedical informatics, promote its use by providing an online website (inspired by TRIPOD-LLM [<xref ref-type="bibr" rid="ref7">7</xref>]), and invite panelists to apply the CINEX guideline in their own research.</p></sec><sec id="s4-2"><title>Limitations</title><p>Our approach has several limitations. First, the development process for the CINEX guideline is based on guidance for reporting guideline development in health research as outlined by Moher et al [<xref ref-type="bibr" rid="ref11">11</xref>]. While the CINEX guideline addresses health-related research, it also intersects significantly with the computer science domain. Currently, however, there are no methodological frameworks for reporting guideline development in computer science. Given this gap, we adopted the framework of Moher et al [<xref ref-type="bibr" rid="ref11">11</xref>], which is well-established and has informed the development of most reporting guidelines endorsed by the EQUATOR Network, including guidelines with a technical focus (eg, CONSORT-AI). Nonetheless, we acknowledge that this choice may not fully capture disciplinary nuances outside the health sciences. The CINEX guideline will therefore be developed with input from the computer sciences as well as clinical disciplines and be tested for clarity and relevance in both contexts.</p><p>Participant recruitment relies partly on professional networks, which may limit diversity. While consensus thresholds and item rating methods are clearly defined a priori with this protocol, they remain subjective to a certain degree. The final in-person consensus meeting, although valuable for discussion, may introduce social influence and new opinions from participants that have not participated in the eDelphi panel. Additionally, the CINEX may require future updates to accommodate rapid developments in LLMs and multimodal approaches.</p></sec><sec id="s4-3"><title>Comparison With Prior Work</title><p>The CINEX guideline builds on the methods used in guidelines like CONSORT-AI, SPIRIT-AI, and TRIPOD-LLM and is the first to focus specifically on clinical IE. Our study design incorporated detailed feedback loops and a 10-point scale instead of a 5-point scale aiming to improve rating precision. While existing AI guidelines address broader study types, none are tailored to the unique needs of clinical text-based IE, underscoring the CINEX guideline&#x2019;s distinct contribution. Furthermore, we seek to address the challenges faced by prior reporting guidelines: first, adoption and enforcement by journals have often been inconsistent, thus limiting their impact; to mitigate this, we will accompany the CINEX guideline with an online template checklist for authors and actively engage journals to encourage endorsement. Second, ambiguity in checklist items has been a barrier to compliance; therefore, the CINEX guideline will be supported by a detailed E&#x0026;E document. Third, the CINEX guideline will include example items tailored for computer science as well as medical audiences, supporting broader adoption across disciplines.</p></sec><sec id="s4-4"><title>Conclusions</title><p>The CINEX guideline fills a critical gap in the reporting of clinical IE studies by offering a dedicated, consensus-driven framework. It aims to improve reproducibility, comparability, and transparency in this growing area of clinical NLP. Continued community involvement and iterative updates will be essential to ensure its ongoing relevance.</p></sec></sec></body><back><ack><p>The CINEX (Clinical Information Extraction) guideline is part of a PhD project at the University of Geneva. No dedicated funding was obtained. Generative AI (ChatGPT [GPT-4o and GPT-5] OpenAI) was used to assist with language editing of the manuscript draft and improve clarity and formatting of responses to peer review comments. No artificial intelligence tool was used to generate original scientific content. All content was reviewed and approved by the authors.</p></ack><fn-group><fn fn-type="con"><p>Conceptualization: DR and KD</p><p>Methodology: DR</p><p>Supervision: HM and KD</p><p>Writing&#x2014;original draft: DR</p><p>Writing&#x2014;review and editing: DR, HM, and KD</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ACCORD</term><def><p>Accurate Consensus Reporting Document</p></def></def-item><def-item><term id="abb2">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb3">CINEX</term><def><p>Clinical Information Extraction</p></def></def-item><def-item><term id="abb4">CONSORT-AI</term><def><p>Consolidated Standards of Reporting Trials&#x2013;Artificial Intelligence</p></def></def-item><def-item><term id="abb5">E&#x0026;E</term><def><p>explanation and elaboration</p></def></def-item><def-item><term id="abb6">eDelphi</term><def><p>electronic Delphi</p></def></def-item><def-item><term id="abb7">EQUATOR</term><def><p>Enhancing the Quality and Transparency Of Health Research</p></def></def-item><def-item><term id="abb8">IE</term><def><p>information extraction</p></def></def-item><def-item><term id="abb9">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb10">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb11">SPIRIT-AI</term><def><p>Standard Protocol Items: Recommendations for Interventional Trials&#x2013;Artificial Intelligence</p></def></def-item><def-item><term id="abb12">TRIPOD+AI</term><def><p>Transparent Reporting of a multivariable prediction model for Individual Prognosis Or Diagnosis&#x2013;Artificial Intelligence</p></def></def-item><def-item><term id="abb13">TRPIOD-LLM</term><def><p>Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis Or Diagnosis specifically tailored for large language models</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Rastegar-Mojarad</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Clinical information extraction applications: A literature review</article-title><source>J Biomed Inform</source><year>2018</year><month>01</month><volume>77</volume><fpage>34</fpage><lpage>49</lpage><pub-id pub-id-type="doi">10.1016/j.jbi.2017.11.011</pub-id><pub-id pub-id-type="medline">29162496</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Reichenpfader</surname><given-names>D</given-names> </name><name name-style="western"><surname>M&#x00FC;ller</surname><given-names>H</given-names> </name><name name-style="western"><surname>Denecke</surname><given-names>K</given-names> </name></person-group><article-title>A scoping review of large language model based approaches for information extraction from radiology reports</article-title><source>NPJ Digit Med</source><year>2024</year><month>08</month><day>24</day><volume>7</volume><issue>1</issue><fpage>222</fpage><pub-id pub-id-type="doi">10.1038/s41746-024-01219-0</pub-id><pub-id pub-id-type="medline">39182008</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Davidson</surname><given-names>EM</given-names> </name><name name-style="western"><surname>Poon</surname><given-names>MTC</given-names> </name><name name-style="western"><surname>Casey</surname><given-names>A</given-names> </name><etal/></person-group><article-title>The reporting quality of natural language processing studies: systematic review of studies of radiology reports</article-title><source>BMC Med Imaging</source><year>2021</year><month>10</month><day>2</day><volume>21</volume><issue>1</issue><fpage>142</fpage><pub-id pub-id-type="doi">10.1186/s12880-021-00671-8</pub-id><pub-id pub-id-type="medline">34600486</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Cruz Rivera</surname><given-names>S</given-names> </name><name name-style="western"><surname>Moher</surname><given-names>D</given-names> </name><name name-style="western"><surname>Calvert</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Denniston</surname><given-names>AK</given-names> </name><collab>SPIRIT-AI and CONSORT-AI Working Group</collab></person-group><article-title>Reporting guidelines for clinical trial reports for interventions involving artificial intelligence: the CONSORT-AI extension</article-title><source>Nat Med</source><year>2020</year><month>09</month><volume>26</volume><issue>9</issue><fpage>1364</fpage><lpage>1374</lpage><pub-id pub-id-type="doi">10.1038/s41591-020-1034-x</pub-id><pub-id pub-id-type="medline">32908283</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cruz Rivera</surname><given-names>S</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>AW</given-names> </name><etal/></person-group><article-title>Guidelines for clinical trial protocols for interventions involving artificial intelligence: the SPIRIT-AI extension</article-title><source>Nat Med</source><year>2020</year><month>09</month><volume>26</volume><issue>9</issue><fpage>1351</fpage><lpage>1363</lpage><pub-id pub-id-type="doi">10.1038/s41591-020-1037-7</pub-id><pub-id pub-id-type="medline">32908284</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Collins</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name><name name-style="western"><surname>Dhiman</surname><given-names>P</given-names> </name><etal/></person-group><article-title>TRIPOD+AI statement: updated guidance for reporting clinical prediction models that use regression or machine learning methods</article-title><source>BMJ</source><year>2024</year><month>04</month><day>16</day><volume>385</volume><fpage>e078378</fpage><pub-id pub-id-type="doi">10.1136/bmj-2023-078378</pub-id><pub-id pub-id-type="medline">38626948</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gallifant</surname><given-names>J</given-names> </name><name name-style="western"><surname>Afshar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ameen</surname><given-names>S</given-names> </name><etal/></person-group><article-title>The TRIPOD-LLM reporting guideline for studies using large language models</article-title><source>Nat Med</source><year>2025</year><month>01</month><volume>31</volume><issue>1</issue><fpage>60</fpage><lpage>69</lpage><pub-id pub-id-type="doi">10.1038/s41591-024-03425-5</pub-id><pub-id pub-id-type="medline">39779929</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Collins</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Reitsma</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Altman</surname><given-names>DG</given-names> </name><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name></person-group><article-title>Transparent reporting of a multivariable prediction model for individual prognosis or diagnosis (TRIPOD): the TRIPOD Statement</article-title><source>BMC Med</source><year>2015</year><month>01</month><day>6</day><volume>13</volume><issue>1</issue><fpage>1</fpage><pub-id pub-id-type="doi">10.1186/s12916-014-0241-z</pub-id><pub-id pub-id-type="medline">25563062</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="web"><article-title>Reporting guidelines under development for other study designs</article-title><source>The EQUATOR Network</source><year>2024</year><access-date>2025-09-18</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.equator-network.org/library/reporting-guidelines-under-development/reporting-guidelines-under-development-for-other-study-designs/#CINEX">https://www.equator-network.org/library/reporting-guidelines-under-development/reporting-guidelines-under-development-for-other-study-designs/#CINEX</ext-link></comment></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="web"><article-title>About us</article-title><source>The EQUATOR Network</source><year>2025</year><access-date>2025-09-18</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.equator-network.org/about-us/">https://www.equator-network.org/about-us/</ext-link></comment></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moher</surname><given-names>D</given-names> </name><name name-style="western"><surname>Schulz</surname><given-names>KF</given-names> </name><name name-style="western"><surname>Simera</surname><given-names>I</given-names> </name><name name-style="western"><surname>Altman</surname><given-names>DG</given-names> </name></person-group><article-title>Guidance for developers of health research reporting guidelines</article-title><source>PLoS Med</source><year>2010</year><month>02</month><day>16</day><volume>7</volume><issue>2</issue><fpage>e1000217</fpage><pub-id pub-id-type="doi">10.1371/journal.pmed.1000217</pub-id><pub-id pub-id-type="medline">20169112</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Reichenpfader</surname><given-names>D</given-names> </name><name name-style="western"><surname>Denecke</surname><given-names>K</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Mantas</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hasman</surname><given-names>A</given-names> </name><name name-style="western"><surname>Demiris</surname><given-names>G</given-names> </name><name name-style="western"><surname>Saranto</surname><given-names>K</given-names> </name><name name-style="western"><surname>Marschollek</surname><given-names>M</given-names> </name><name name-style="western"><surname>Arvanitis</surname><given-names>TN</given-names> </name><name name-style="western"><surname>Ognjanovi&#x0107;</surname><given-names>I</given-names> </name><name name-style="western"><surname>Benis</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gallos</surname><given-names>P</given-names> </name><name name-style="western"><surname>Zoulias</surname><given-names>E</given-names> </name><name name-style="western"><surname>Andrikopoulou</surname><given-names>E</given-names> </name></person-group><article-title>Towards a reporting guideline for studies on information extraction from clinical texts</article-title><source>Stud Health Technol Inform</source><year>2024</year><publisher-name>IOS Press</publisher-name><pub-id pub-id-type="doi">10.3233/SHTI240744</pub-id><pub-id pub-id-type="other">978-1-64368-533-5</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>H&#x00E4;der</surname><given-names>M</given-names> </name></person-group><source>Delphi-Befragungen: Ein Arbeitsbuch</source><year>2014</year><publisher-name>Springer Fachmedien</publisher-name><pub-id pub-id-type="doi">10.1007/978-3-658-01928-0</pub-id><pub-id pub-id-type="other">978-3-658-01927-3</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nasa</surname><given-names>P</given-names> </name><name name-style="western"><surname>Jain</surname><given-names>R</given-names> </name><name name-style="western"><surname>Juneja</surname><given-names>D</given-names> </name></person-group><article-title>Delphi methodology in healthcare research: How to decide its appropriateness</article-title><source>World J Methodol</source><year>2021</year><month>07</month><day>20</day><volume>11</volume><issue>4</issue><fpage>116</fpage><lpage>129</lpage><pub-id pub-id-type="doi">10.5662/wjm.v11.i4.116</pub-id><pub-id pub-id-type="medline">34322364</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Trevelyan</surname><given-names>EG</given-names> </name><name name-style="western"><surname>Robinson</surname><given-names>PN</given-names> </name></person-group><article-title>Delphi methodology in health research: how to do it?</article-title><source>Eur J Integr Med</source><year>2015</year><month>08</month><volume>7</volume><issue>4</issue><fpage>423</fpage><lpage>428</lpage><pub-id pub-id-type="doi">10.1016/j.eujim.2015.07.002</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="web"><article-title>LimeSurvey: an open source survey tool hamburg</article-title><source>LimeSurvey GmbH</source><year>2024</year><access-date>2025-09-18</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://www.limesurvey.org">http://www.limesurvey.org</ext-link></comment></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>H</given-names> </name><name name-style="western"><surname>Leung</surname><given-names>SO</given-names> </name></person-group><article-title>Can Likert scales be treated as interval scales?&#x2014;A simulation study</article-title><source>J Soc Serv Res</source><year>2017</year><month>08</month><day>8</day><volume>43</volume><issue>4</issue><fpage>527</fpage><lpage>532</lpage><pub-id pub-id-type="doi">10.1080/01488376.2017.1329775</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gattrell</surname><given-names>WT</given-names> </name><name name-style="western"><surname>Logullo</surname><given-names>P</given-names> </name><name name-style="western"><surname>van Zuuren</surname><given-names>EJ</given-names> </name><etal/></person-group><article-title>ACCORD (ACcurate COnsensus Reporting Document): A reporting guideline for consensus methods in biomedicine developed via a modified Delphi</article-title><source>PLOS Med</source><year>2024</year><month>01</month><day>23</day><volume>21</volume><issue>1</issue><fpage>e1004326</fpage><pub-id pub-id-type="doi">10.1371/journal.pmed.1004326</pub-id></nlm-citation></ref></ref-list></back></article>