<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Res Protoc</journal-id><journal-id journal-id-type="publisher-id">ResProt</journal-id><journal-id journal-id-type="index">5</journal-id><journal-title>JMIR Research Protocols</journal-title><abbrev-journal-title>JMIR Res Protoc</abbrev-journal-title><issn pub-type="epub">1929-0748</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v15i1e86425</article-id><article-id pub-id-type="doi">10.2196/86425</article-id><article-categories><subj-group subj-group-type="heading"><subject>Protocol</subject></subj-group></article-categories><title-group><article-title>A Natural Language Processing Framework for Structuring and Visualizing Clinical Trial Eligibility Criteria at Scale: Protocol for a Quantitative Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Xie</surname><given-names>Justin</given-names></name><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Parikh</surname><given-names>Jeet</given-names></name><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liu</surname><given-names>Jessica</given-names></name><degrees>BS</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Pandya</surname><given-names>Sameer</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Gong</surname><given-names>Guannan</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Yale College, Yale University</institution><addr-line>New Haven</addr-line><addr-line>CT</addr-line><country>United States</country></aff><aff id="aff2"><institution>Yale Cancer Center, Yale School of Medicine</institution><addr-line>333 Cedar Street</addr-line><addr-line>New Haven</addr-line><addr-line>CT</addr-line><country>United States</country></aff><aff id="aff3"><institution>Department of Laboratory Medicine, Yale School of Medicine</institution><addr-line>New Haven</addr-line><addr-line>CT</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Sarvestan</surname><given-names>Javad</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Wyatt</surname><given-names>Kirk D</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Guannan Gong, PhD, Yale Cancer Center, Yale School of Medicine, 333 Cedar Street, New Haven, CT, 06510, United States, 1 203-200-2328; <email>guannan.gong@yale.edu</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>14</day><month>5</month><year>2026</year></pub-date><volume>15</volume><elocation-id>e86425</elocation-id><history><date date-type="received"><day>23</day><month>10</month><year>2025</year></date><date date-type="rev-recd"><day>11</day><month>03</month><year>2026</year></date><date date-type="accepted"><day>12</day><month>03</month><year>2026</year></date></history><copyright-statement>&#x00A9; Justin Xie, Jeet Parikh, Jessica Liu, Sameer Pandya, Guannan Gong. Originally published in JMIR Research Protocols (<ext-link ext-link-type="uri" xlink:href="https://www.researchprotocols.org">https://www.researchprotocols.org</ext-link>), 14.5.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.researchprotocols.org">https://www.researchprotocols.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.researchprotocols.org/2026/1/e86425"/><abstract><sec><title>Background</title><p>Eligibility criteria are essential to clinical trial design, guiding recruitment, and ensuring patient safety and scientific rigor. However, criteria are often lengthy, heterogeneous, and inconsistently formatted, which hinders large-scale interpretation and slows patient-trial matching. Manual review is time-consuming and error-prone. Advances in natural language processing and large language models (LLMs) offer opportunities to standardize and analyze eligibility text at scale.</p></sec><sec><title>Objective</title><p>This study aims to develop and evaluate a scalable system that uses LLM-enabled natural language processing and unsupervised learning to identify, normalize, categorize, and visualize clinical trial eligibility criteria, with the goal of improving patient-trial matching and revealing domain-level trends.</p></sec><sec sec-type="methods"><title>Methods</title><p>We designed a three-part pipeline: (1) representation of eligibility text using embeddings, followed by clustering to group semantically similar criteria; (2) dual-layer zero-shot LLM summarization for concept normalization, refinement, and deduplication of cluster exemplars; and (3) an interactive, web-based visualization interface to explore criteria distributions and trends by disease domain and over time. The pipeline was applied to 53,872 oncology trials (breast, lung, and gastrointestinal cancer) indexed on ClinicalTrials.gov. Outputs include cluster labels, normalized criterion summaries, and per-domain frequency profiles. Feasibility was assessed via successful end-to-end processing and inspection of face validity for cluster coherence and domain-specific patterns.</p></sec><sec sec-type="results"><title>Results</title><p>The system successfully processed all 53,872 trials and generated stable clusters of inclusion and exclusion concepts. The LLM summarization layers produced concise, nonredundant labels that improved the interpretability of clustered criteria. The visualization interface enabled rapid exploration of cross-trial patterns and temporal trends within breast, lung, and gastrointestinal oncology, facilitating identification of common inclusion requirements and potential barriers to enrollment. A public, open-source demonstration instance allows for interactive exploration of these clusters and summaries. Benchmarking through human validation on a random sample of eligibility criteria found the system to be 94% (470/500) accurate, reflecting its ability to consistently categorize criteria correctly in congruence with human judgment.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>A combined embeddings-clustering-LLM pipeline can standardize heterogeneous eligibility text and surface domain-level patterns at scale. This framework provides a foundation for accelerating patient-trial matching and informing future trial design. While the current implementation was evaluated on ClinicalTrials.gov oncology trials, the approach is readily generalizable to additional diseases and alternative modeling configurations.</p></sec><sec sec-type="registered-report"><title>International Registered Report Identifier (IRRID)</title><p>DERR1-10.2196/86425</p></sec></abstract><kwd-group><kwd>eligibility determination</kwd><kwd>clinical trials as topic</kwd><kwd>natural language processing</kwd><kwd>large language models</kwd><kwd>machine learning</kwd><kwd>data visualization</kwd><kwd>cluster analysis</kwd><kwd>breast neoplasms</kwd><kwd>lung neoplasms</kwd><kwd>gastrointestinal neoplasms</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background and Significance</title><p>Eligibility criteria are fundamental to clinical trial design, serving as the basis for patient recruitment and ensuring participant safety [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. However, these criteria are often written in heterogeneous and semistructured formats across protocols, making automated interpretation and matching challenging [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Traditionally, assessing patient eligibility requires manual chart review&#x2014;a time-consuming and error-prone process that contributes to screening inefficiencies and delays in trial enrollment [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. To address this, automated systems have been developed to streamline patient-trial matching by extracting and standardizing relevant data from electronic health records [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>].</p><p>Recent advancements in natural language processing (NLP) and large language models (LLMs) have created new opportunities for improving automated clinical trial matching systems and reducing recruitment timelines [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. Foundational transformer-based and LLM architectures have demonstrated strong capabilities in clinical and biomedical language understanding [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref17">17</xref>], including medical question answering and licensing examinations [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>], information extraction [<xref ref-type="bibr" rid="ref20">20</xref>], and medical-oriented conversational systems [<xref ref-type="bibr" rid="ref21">21</xref>]. LLMs have increasingly served as a backbone for automated patient-trial matching approaches [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>].</p><p>Despite these advances, a critical gap remains: the absence of a unified framework for normalizing, summarizing, and benchmarking eligibility criteria at scale [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Without systematic normalization, trial designers cannot easily compare their criteria against prevailing standards, potentially leading to overly restrictive eligibility definitions that may limit accrual and reduce generalizability [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref25">25</xref>].</p><p>To address this need, we developed an LLM-enabled NLP and unsupervised learning system designed to summarize frequently used eligibility concepts, identify emerging trends, and support evidence-informed protocol design. In practice, this tool functions as a decision support platform for protocol optimization, enabling researchers to detect redundant or &#x201C;outlier&#x201D; criteria that may unnecessarily constrain the eligible patient population. Furthermore, it addresses infrastructure scalability challenges by introducing a standardized concept representation layer that facilitates cross-trial interoperability without manual reconfiguration.</p><p>Our prototype features a three-part architecture: (1) extraction and embedding of eligibility criteria, (2) unsupervised clustering with dual-layer LLM summarization, and (3) an interactive web-based exploration interface. This system provides researchers with an intuitive platform for analyzing patterns in clinical trial design and supporting scalable, model-driven enhancements to automated trial matching infrastructure.</p></sec><sec id="s1-2"><title>Study Objectives</title><p>In this study, we introduce a novel system that leverages foundational language models to identify, categorize, summarize, and visualize clinical trial eligibility criteria across disease domains. Our approach is tailored to the analysis of clinical trial protocols with the goal of improving automated patient matching and informing future trial design.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>We developed a novel, scalable system for categorizing and visualizing clusters of clinical trial eligibility criteria with the aim of identifying recurring patterns across disease domains. The system has 3 components: unsupervised clustering of semantically similar criteria, LLM-based summarization, and an interactive visualization interface. For feasibility, we prototyped the system using clinical trial data from breast, lung, and gastrointestinal (GI) oncology. The visualization tool enables users to explore and interact with eligibility criteria clusters through features such as dynamic highlighting, panning, zooming, and time-based filtering. This allows for temporal analysis of how eligibility criteria evolve, offering new insights into clinical trial design trends across oncology subtypes.</p><p>The data used in this study were extracted from ClinicalTrials.gov via the application programming interface (API). Text embeddings were obtained through the <italic>text-embedding-3-large</italic> embeddings model. Clustering was completed through the k-means algorithm provided by the open-source scikit-learn library (Google Summer of Code project). Summarization was achieved through the LLM GPT-4o (OpenAI) via API. All data transmitted to external APIs consisted solely of deidentified, publicly available eligibility criteria text. No trial identifiers, patient-level data, or personal health information were included.</p></sec><sec id="s2-2"><title>Data Sources</title><p>Clinical trial data were extracted from ClinicalTrials.gov via the API for 3 oncology domains: breast cancer, lung cancer, and GI cancer. Disease-specific keywords (&#x201C;breast cancer,&#x201D; &#x201C;lung cancer,&#x201D; and &#x201C;GI oncology&#x201D;) were used to retrieve relevant trial information&#x2014;including National Clinical Trial ID, eligibility criteria text, trial sponsor, sponsor type, and trial start date. Only trials containing complete data across all required fields were included in the analysis. All open or enrolling and closed trials were considered part of the initial dataset. The final dataset comprised 53,872 oncology trials, including 14,222 breast cancer trials, 15,624 lung cancer trials, and 24,026 GI oncology trials. These records served as the foundation for subsequent preprocessing, clustering, and analysis.</p></sec><sec id="s2-3"><title>Data Preprocessing</title><p>Given that the focus of this study was on industry eligibility criteria, analyses were restricted to industry-sponsored trials listed on ClinicalTrials.gov to maintain consistency in reporting structure and formatting. As a result, the datasets were refined to 3108 breast cancer trials, 4470 lung cancer trials, and 4539 GI oncology trials.</p><p>The second stage involved isolating inclusion criteria. Inclusion criteria were prioritized over exclusion criteria because inclusion criteria are more directly relevant to patient-trial matching. Additionally, merging both criterion types in a single analysis could lead to confusion in interpretation for end users. Thus, our system was designed to process both types independently, allowing for more interpretable clustering results.</p><p>In the final preprocessing step, we transformed the unstructured eligibility criteria text from ClinicalTrials.gov into a structured, line-by-line format suitable for downstream analysis. While most trials presented criteria as bullet points, formatting varied considerably across entries. We applied a series of regular expression filters to normalize the text&#x2014;removing extraneous characters, bullet markers, line breaks, and indentation. This process yielded coherent lines of inclusion criteria, most of which reflected interpretable and meaningful content. The small subset of noisy or malformed entries was effectively neutralized through the clustering and summarization components later in the pipeline.</p><p>After preprocessing, the final datasets included 31,009 lines of inclusion criteria for breast cancer, 44,595 lines of inclusion criteria for lung cancer, and 42,555 lines of inclusion criteria for GI oncology. These were stored as structured CSV files, with each line of inclusion criteria linked to its corresponding National Clinical Trial ID and trial start date. A summary of dataset statistics is provided in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Dataset statistics in stages of data preprocessing.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Breast cancer, n</td><td align="left" valign="bottom">Lung cancer, n</td><td align="left" valign="bottom">GI<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> oncology, n</td></tr></thead><tbody><tr><td align="left" valign="top">Total trials (raw data)</td><td align="left" valign="top">14,222</td><td align="left" valign="top">15,624</td><td align="left" valign="top">24,026</td></tr><tr><td align="left" valign="top">Trials after industry filter</td><td align="left" valign="top">3108</td><td align="left" valign="top">4470</td><td align="left" valign="top">4539</td></tr><tr><td align="left" valign="top">Lines of inclusion criteria</td><td align="left" valign="top">31,009</td><td align="left" valign="top">44,595</td><td align="left" valign="top">42,555</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>GI: gastrointestinal.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-4"><title>System Summary</title><sec id="s2-4-1"><title>Overview</title><p>We developed a generalizable three-phase system designed to (1) embed and cluster, (2) summarize, and (3) visualize clinical trial eligibility criteria across disease domains. The pipeline is illustrated in <xref ref-type="fig" rid="figure1">Figure 1</xref>. The system uses text embeddings and an unsupervised learning model to extract eligibility criteria from clinical trial records and group trials by semantic similarity. To refine the clusters, we use a generative pretrained transformer&#x2013;based language model in a zero-shot setting, enabling 2 layers of summarization. The first layer summarizes the content within each cluster, whereas the second layer functions as a quality control mechanism, filtering duplicate, overly narrow, or irrelevant clusters to improve clarity and relevance. Inspired by MedViz&#x2014;a platform for visualizing medical literature [<xref ref-type="bibr" rid="ref26">26</xref>]&#x2014;the web interface supports visualization of criteria clusters over time and across disease domains, with features such as time-based filtering, dynamic cluster highlighting, and smart tooltips.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>System overview: phase 1 (embed and cluster), phase 2 (dual-layer large language model [LLM] summarization), and phase 3 (visualization). Regex: regular expression.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="resprot_v15i1e86425_fig01.png"/></fig></sec><sec id="s2-4-2"><title>Phase 1: Embed and Cluster</title><p>To semantically cluster and categorize the eligibility criteria data, we used OpenAI&#x2019;s <italic>text-embedding-3-large</italic> model to generate semantically accurate, 3072D vector embeddings for each criterion. To cluster, we used a k-means clustering algorithm from scikit-learn. A cluster count of 100 was selected based on a trade-off between thematic specificity and statistical robustness. Smaller cluster counts produced overly broad groupings that obscured emerging and specialized criteria such as biomarkers (eg, <italic>BRCA1</italic> or <italic>BRCA2</italic>), whereas larger counts fragmented semantically coherent groups and resulted in clusters with insufficient density for stable summarization. We found an effective balance at a <italic>K</italic> value of 100 between granularity and interpretability.</p><p>To further ensure robustness, clusters containing fewer than 100 inclusion criteria were excluded to avoid instability in similarity estimation and summarization. It should be noted that the visualization tool displays small-sized clusters but no information beyond their relationship to larger, relevant clusters. For the remaining clusters, we computed average intracluster cosine similarity and applied a threshold of 0.5 to enforce semantic coherence. As unsupervised clustering does not involve class labels, traditional class imbalance mitigation was not applicable. However, to address variability in cluster sizes, the minimum threshold of 100 inclusion criteria per cluster helped ensure that all retained clusters had sufficient density for stable summarization and reduce the influence of disproportionately small groupings on downstream analysis.</p><p>Due to the unsupervised learning approach and absence of ground-truth labels, conventional performance evaluation during training was not applicable. Instead, clustering performance was assessed post hoc through a human validation benchmark whereby independent evaluators served as the ground truth for verifying cluster label assignments.</p></sec><sec id="s2-4-3"><title>Phase 2: Summarize</title><p>The second phase generates summarization labels for each of the clusters. For both primary and secondary summarization, we leveraged OpenAI&#x2019;s GPT-4o model and designed zero-shot prompts for cluster labeling. This model was selected based on its general language and semantic understanding. Both the <italic>text-embedding-3-large</italic> and GPT-4o models were used as off-the-shelf, pretrained models without additional fine-tuning. Given that GPT-4o demonstrates strong zero-shot generalization across language tasks and that no domain-specific labeled training data were available, fine-tuning was deemed unnecessary for the summarization objectives of this study.</p><p>In both primary and secondary summarization, a temperature of 0 and top_p of 0.1 were used to minimize variability in LLM responses and control response quality. The specifics of the prompting can be found in <xref ref-type="fig" rid="figure2">Figure 2</xref>.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Prompting schema for primary and secondary summarization (example prompts; brief 5-word labels to minimize clutter).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="resprot_v15i1e86425_fig02.png"/></fig><p>To generate preliminary labels for each cluster, we provided 100 inclusion criteria that were randomly selected from each cluster along with a system and user prompt to the LLM. The LLM was prompted to generate a set of short, 5-word labels that provided a general summary of the specific criteria for each cluster. The short labels minimized visual clutter in the visualization application. The prompts could be altered to achieve varying levels of detail.</p><p>As primary summarization created some labels with a high degree of overlap, we used a similar prompting approach for secondary summarization whereby the LLM examined labels from primary summarization and identified semantically similar clusters. The merged clusters were given new 5-word labels by the model. The final cluster set included the merged clusters and clusters from the primary summarization that did not require reorganization.</p></sec><sec id="s2-4-4"><title>Phase 3: Visualize</title><p>To prepare the data for visualization, we performed a 2D reduction on all inclusion criteria embeddings using t-distributed stochastic neighbor embedding via scikit-learn. The resulting 2D coordinates were plotted on a scatterplot, with cluster label positions calculated by averaging the x and y coordinates of all criteria within each cluster. An interactive web application was developed using Three.js and React to display cluster data stratified by time and disease type. <xref ref-type="fig" rid="figure3">Figures 3</xref> and <xref ref-type="fig" rid="figure4">4</xref> provide screenshots of the visualization application. Features of the interactive tool are presented in detail in the Results section.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Interactive visualization: domain faceting, label hover highlighting, and dynamic cluster display.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="resprot_v15i1e86425_fig03.png"/></fig><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Temporal view: trial start date histogram and time window filtering.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="resprot_v15i1e86425_fig04.png"/></fig></sec></sec><sec id="s2-5"><title>Ethical Considerations</title><p>This study used only publicly available, deidentified clinical trial eligibility criteria data obtained from ClinicalTrials.gov. Therefore, the study did not require institutional review board approval or informed consent.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>The culmination of our novel design and 3-phase system is a visualization tool that aims to provide users and researchers with an interactive method through which they can explore details of eligibility criteria for varying disease domains. Trends such as the distribution and evolution of criteria over time and the most common criteria can be observed using our tool. Currently, the tool allows users to interact with industry clinical trial inclusion criteria data for breast cancer, lung cancer, and GI oncology from ClinicalTrials.gov. However, following the designed pipeline of data extraction, preprocessing, clustering, summarization, and visualization, the tool is easily scalable to a wide array of disease domains. As of April 2026, the tool provides 3 features.</p></sec><sec id="s3-2"><title>Benchmarking Through Human Validation</title><p>A benchmark of the framework&#x2019;s clustering accuracy was conducted using human validation, with evaluators serving as the ground truth for assessing clustering and labeling performance. A simple random sample of 500 eligibility criteria, along with the complete list of potential cluster labels, was provided to the evaluators. For each criterion, 2 independent evaluators determined whether the assigned cluster label was appropriate. Of the 500 sampled criteria, evaluators deemed 470 (94%) to have the appropriate cluster label assignments. Detailed evaluation results are presented in <xref ref-type="table" rid="table2">Table 2</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Human validation benchmark results.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Total labels evaluated, n</td><td align="left" valign="bottom">LLM<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> correctly labeled samples, n</td><td align="left" valign="bottom">LLM incorrectly labeled samples, n</td><td align="left" valign="bottom">Accuracy (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Human evaluator 1</td><td align="left" valign="top">250</td><td align="left" valign="top">239</td><td align="left" valign="top">11</td><td align="left" valign="top">95.6</td></tr><tr><td align="left" valign="top">Human evaluator 2</td><td align="left" valign="top">250</td><td align="left" valign="top">231</td><td align="left" valign="top">19</td><td align="left" valign="top">92.4</td></tr><tr><td align="left" valign="top">Total</td><td align="left" valign="top">500</td><td align="left" valign="top">470</td><td align="left" valign="top">30</td><td align="left" valign="top">94</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>LLM: large language model.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>Feature 1: Criteria Clusters</title><p>A ranking of the most common eligibility criteria clusters is displayed within the tool; see <xref ref-type="table" rid="table3">Table 3</xref> for reference. Users can select a criteria cluster to highlight it alongside its corresponding label. The tool also includes an interactive hover feature that displays the quantity and distribution of eligibility criteria within each cluster.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Most common criteria clusters summarized.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Cluster rank</td><td align="left" valign="bottom">Breast cancer</td><td align="left" valign="bottom">Lung cancer</td><td align="left" valign="bottom">GI<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> oncology</td></tr></thead><tbody><tr><td align="left" valign="top">1</td><td align="left" valign="top">Prior treatment conditions</td><td align="left" valign="top">ECOG<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> performance status requirements</td><td align="left" valign="top">Age criteria for participation</td></tr><tr><td align="left" valign="top">2</td><td align="left" valign="top">Metastatic disease confirmation</td><td align="left" valign="top">Measurable disease criteria</td><td align="left" valign="top">ECOG performance status criteria</td></tr><tr><td align="left" valign="top">3</td><td align="left" valign="top">Age requirements</td><td align="left" valign="top">Effective contraception and pregnancy prevention</td><td align="left" valign="top">Informed consent requirements</td></tr><tr><td align="left" valign="top">4</td><td align="left" valign="top">Organ function requirements</td><td align="left" valign="top">Age requirements for participation</td><td align="left" valign="top">Adequate organ function requirements</td></tr><tr><td align="left" valign="top">5</td><td align="left" valign="top">ECOG performance status criteria</td><td align="left" valign="top">Prior treatment and therapy requirements</td><td align="left" valign="top">Measurable disease criteria</td></tr><tr><td align="left" valign="top">6</td><td align="left" valign="top">Contraception and pregnancy requirements</td><td align="left" valign="top">Minimum life expectancy criteria</td><td align="left" valign="top">Effective contraception requirement</td></tr><tr><td align="left" valign="top">7</td><td align="left" valign="top">Informed consent requirements</td><td align="left" valign="top">Informed consent requirements</td><td align="left" valign="top">Failed prior therapies or no options</td></tr><tr><td align="left" valign="top">8</td><td align="left" valign="top">Measurable disease criteria</td><td align="left" valign="top">Advanced, untreated, non&#x2013;small cell lung cancer</td><td align="left" valign="top">Recovery from prior cancer treatment</td></tr><tr><td align="left" valign="top">9</td><td align="left" valign="top">Breast cancer diagnosis requirements</td><td align="left" valign="top">Histologically confirmed advanced non&#x2013;small cell lung cancer</td><td align="left" valign="top">Prior treatment failure in CRC<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td></tr><tr><td align="left" valign="top">10</td><td align="left" valign="top">Treatment tolerance and recovery</td><td align="left" valign="top">Advanced, unresectable, or metastatic tumors</td><td align="left" valign="top">Advanced or metastatic cancer eligibility</td></tr><tr><td align="left" valign="top">11</td><td align="left" valign="top">Normal laboratory values</td><td align="left" valign="top">Advanced solid tumors refractory to treatment</td><td align="left" valign="top">Willingness and ability to comply</td></tr><tr><td align="left" valign="top">12</td><td align="left" valign="top">Tumor tissue and biopsy requirements</td><td align="left" valign="top">Performance status &#x2264;2; life expectancy</td><td align="left" valign="top">Histologically confirmed metastatic colorectal cancer</td></tr><tr><td align="left" valign="top">13</td><td align="left" valign="top">Life expectancy requirements</td><td align="left" valign="top">EGFR<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup> mutation treatment failure criteria</td><td align="left" valign="top">Advanced, unresectable, or refractory solid tumors</td></tr><tr><td align="left" valign="top">14</td><td align="left" valign="top">Normal liver function criteria required</td><td align="left" valign="top">Negative pregnancy test and contraception</td><td align="left" valign="top">Adequate hepatic function criteria</td></tr><tr><td align="left" valign="top">15</td><td align="left" valign="top">Postmenopausal women with defined criteria</td><td align="left" valign="top">Tumor tissue availability and consent</td><td align="left" valign="top">Confirmed diagnosis of hepatocellular carcinoma</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>GI: gastrointestinal.</p></fn><fn id="table3fn2"><p><sup>b</sup>ECOG: Eastern Cooperative Oncology Group.</p></fn><fn id="table3fn3"><p><sup>c</sup>CRC: colorectal cancer.</p></fn><fn id="table3fn4"><p><sup>d</sup>EGFR: epidermal growth factor receptor.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>Feature 2: Interaction</title><p>The tool provides users with abilities such as zooming and panning to better interact with various areas of the scatterplot. A fixed scatter point size feature maintains point size regardless of zoom level. This allows for access to specific groups of data points and for investigation of the minutiae of criteria distribution. Another feature is label hovering. When a user hovers over the label of a cluster, all criteria within that cluster are highlighted through animation, enabling visualization of distribution and size of different inclusion criteria clusters.</p></sec><sec id="s3-5"><title>Feature 3: Time</title><p>Our tool allows users to filter displayed criteria over time. Criteria are organized by corresponding trial start date and plotted in colors corresponding to specific 5-year spans. Additionally, an interactive histogram allows users to adjust the trial start date window to filter for criteria within selected years.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Anticipated Findings</title><p>In this paper, we propose a novel, generalizable pipeline for analyzing clinical trial eligibility criteria. Our system consists of 3 components&#x2014;semantic clustering, 2-stage summarization via LLMs, and an interactive visualization tool&#x2014;designed to extract, categorize, and present common inclusion criteria across disease domains. This approach enables scalable analysis of eligibility criteria and provides a foundation for improving automated patient-trial matching systems.</p><p>To demonstrate the feasibility of our approach, we developed a prototype site for analysis of breast cancer, lung cancer, and GI oncology trial criteria. As standardization and summarization of eligibility criteria are critical to automated patient matching systems, the proposed interactive tool may contribute to both the advancement of automated patient matching systems and the design of future clinical trials by providing valuable insights into important criteria trends. For example, the tool can be used to analyze the coverage of an automated clinical trial patient matching system, identifying the strengths and weaknesses of the system in selecting patients based on criterion areas. This has implications for patient health outcomes: overly restrictive or inconsistently applied eligibility criteria are a documented barrier to trial enrollment, particularly among underrepresented populations [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]. By surfacing criteria trends across thousands of trials, the tools may equip trial designers with the evidence needed to identify criteria that may unnecessarily exclude eligible patients, streamline redundant requirements, and potentially broaden access to treatments. For clinicians and trial coordinators, the tool provides a reference for benchmarking a given trial&#x2019;s eligibility structure against established patterns in the field, supporting more informed and equitable protocol design.</p><p>First, our preliminary design leveraged data from ClinicalTrials.gov, focusing on a subset of industry-sponsored trials to ensure data consistency and relevance to real-world implementation. To maintain feasibility and depth of analysis, the prototype was scoped to the solid tumor domain, which represents a large and diverse set of oncology trials with substantial clinical and research interest. In addition, the clustering and summarization algorithms are far from perfect, sometimes leading to extraneous or out-of-scope clusters, labels, and results. Errors in cluster assignments or summarization labels could propagate to downstream applications, including automated patient-trial matching systems, by misrepresenting eligibility criteria categories; this risk is mitigated by the 2-stage filtration process, cosine similarity thresholding, and the human validation benchmark described in the Results section. This tool is meant to serve as a first step toward improving the coverage and capabilities of automated clinical trial patient matching systems, with the longer-term goal of reducing the time between patient identification and trial enrollment.</p><p>To expand application of the tool beyond solid tumor disease domains, future work should explore trials beyond the 3 oncology domains highlighted in this paper, as well as a wider array of foundational clustering algorithms and LLMs. Improvements in the capabilities of our designed system are also among potential future studies. For example, this may include expanding the tool beyond solid tumor oncology, expanding the trial database to additional registries and disease areas, benchmarking various clustering algorithms (eg, k-means and density-based spatial clustering of applications with noise) to improve grouping criteria clusters, and expanding the visualization dashboard with suites of filters and tools so researchers can more effectively investigate criteria coverage. These targeted enhancements will increase both the breadth and utility of the proposed system.</p></sec><sec id="s4-2"><title>Conclusions</title><p>This study demonstrates the feasibility and utility of an unsupervised, LLM-driven pipeline for structuring and visualizing clinical trial eligibility criteria at scale. By applying text embedding, clustering, and zero-shot summarization techniques, we were able to organize unstructured eligibility texts into interpretable clusters and generate domain-specific insights through an interactive visualization tool. Our findings reveal recurring patterns across disease domains&#x2014;such as consistent emphasis on performance status, organ function, and prior treatment history&#x2014;as well as domain-specific nuances such as differential emphasis on pregnancy prevention in breast cancer trials or molecular diagnostics in lung cancer. These patterns not only reflect current clinical practice but also point to areas where eligibility requirements could be streamlined or standardized to enhance patient access and diversity in trials.</p><p>The ability to surface and compare common eligibility themes across thousands of trials allows for more informed, data-driven protocol design, offering trial sponsors, researchers, and regulatory bodies a pathway toward reducing unnecessary complexity, improving feasibility, and minimizing barriers to enrollment. By embedding eligibility criteria into a structured, computable format, our framework also paves the way for integration with electronic health records and trial matching platforms, enhancing automation and reducing the manual burden in the recruitment process.</p><p>Although our prototype was limited to solid tumor oncology and used a subset of industry-sponsored trials from ClinicalTrials.gov, the methodology is readily generalizable. Future work will expand to additional disease areas, incorporate real-world data validation, and further optimize the NLP pipeline for deployment in clinical decision support systems. Ultimately, this framework lays the groundwork for a scalable, generalizable, and open-source infrastructure that can support more inclusive, efficient, and intelligent clinical trial design and matching.</p></sec></sec></body><back><ack><p>The authors thank the MedViz project for inspiring aspects of their visualization approach and Dr Huan He for his introduction of MedViz, which helped shape the conceptualization of this work. The authors declare the use of generative artificial intelligence (GenAI) in the research and writing process. According to the Generative Artificial Intelligence Delegation Taxonomy (2025), the following tasks were delegated to GenAI tools under full human supervision: text generation, proofreading and editing, and reformatting. The GenAI tool used was GPT-5.2 (OpenAI). Responsibility for the final manuscript lies entirely with the authors. GenAI tools are not listed as authors and do not bear responsibility for the final outcomes.</p></ack><notes><sec><title>Funding</title><p>This study was funded by the Yale New Haven Health Innovation Award as part of its Health Innovation Program (Clinical Trial Patient Matching project; PI: GG). The project is supported for a 2.5-year period from July 1, 2024, to December 31, 2026, with total funding of US $100,000 [<xref ref-type="bibr" rid="ref30">30</xref>].</p></sec><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available from the corresponding author on reasonable request [<xref ref-type="bibr" rid="ref31">31</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: GG</p><p>Data curation: JX, JP</p><p>Formal analysis: GG, JX</p><p>Methodology: GG</p><p>Software: JX, JP, GG</p><p>Supervision: GG</p><p>Visualization: JX, JP</p><p>Writing&#x2014;original draft: JX, GG</p><p>Writing&#x2014;review and editing: all authors</p></fn><fn fn-type="conflict"><p>GG is the founder of CtrlTrial Inc, a company leveraging artificial intelligence and real-world data to accelerate clinical trial design and patient enrollment. All other authors declare no other conflicts of interest.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">API</term><def><p>application programming interface</p></def></def-item><def-item><term id="abb2">GI</term><def><p>gastrointestinal</p></def></def-item><def-item><term id="abb3">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb4">NLP</term><def><p>natural language processing</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Van Spall</surname><given-names>HG</given-names> </name><name name-style="western"><surname>Toren</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kiss</surname><given-names>A</given-names> </name><name name-style="western"><surname>Fowler</surname><given-names>RA</given-names> </name></person-group><article-title>Eligibility criteria of randomized controlled trials published in high-impact general medical journals: a systematic sampling review</article-title><source>JAMA</source><year>2007</year><month>03</month><day>21</day><volume>297</volume><issue>11</issue><fpage>1233</fpage><lpage>1240</lpage><pub-id pub-id-type="doi">10.1001/jama.297.11.1233</pub-id><pub-id pub-id-type="medline">17374817</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>ES</given-names> </name><name name-style="western"><surname>Bernstein</surname><given-names>D</given-names> </name><name name-style="western"><surname>Hilsenbeck</surname><given-names>SG</given-names> </name><etal/></person-group><article-title>Modernizing eligibility criteria for molecularly driven trials</article-title><source>J Clin Oncol</source><year>2015</year><month>09</month><day>1</day><volume>33</volume><issue>25</issue><fpage>2815</fpage><lpage>2820</lpage><pub-id pub-id-type="doi">10.1200/JCO.2015.62.1854</pub-id><pub-id pub-id-type="medline">26195710</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Tu</surname><given-names>SW</given-names> </name><name name-style="western"><surname>Sim</surname><given-names>I</given-names> </name><name name-style="western"><surname>Richesson</surname><given-names>R</given-names> </name></person-group><article-title>Formal representation of eligibility criteria: a literature review</article-title><source>J Biomed Inform</source><year>2010</year><month>06</month><volume>43</volume><issue>3</issue><fpage>451</fpage><lpage>467</lpage><pub-id pub-id-type="doi">10.1016/j.jbi.2009.12.004</pub-id><pub-id pub-id-type="medline">20034594</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ross</surname><given-names>J</given-names> </name><name name-style="western"><surname>Tu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Carini</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sim</surname><given-names>I</given-names> </name></person-group><article-title>Analysis of eligibility criteria complexity in clinical trials</article-title><source>Summit Transl Bioinform</source><year>2010</year><month>03</month><day>1</day><volume>2010</volume><fpage>46</fpage><lpage>50</lpage><pub-id pub-id-type="medline">21347148</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Embi</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Jain</surname><given-names>A</given-names> </name><name name-style="western"><surname>Clark</surname><given-names>J</given-names> </name><name name-style="western"><surname>Harris</surname><given-names>CM</given-names> </name></person-group><article-title>Development of an electronic health record-based Clinical Trial Alert system to enhance recruitment at the point of care</article-title><source>AMIA Annu Symp Proc</source><year>2005</year><volume>2005</volume><fpage>231</fpage><lpage>235</lpage><pub-id pub-id-type="medline">16779036</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Treweek</surname><given-names>S</given-names> </name><name name-style="western"><surname>Pitkethly</surname><given-names>M</given-names> </name><name name-style="western"><surname>Cook</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Strategies to improve recruitment to randomised trials</article-title><source>Cochrane Database Syst Rev</source><year>2018</year><month>02</month><day>22</day><volume>2</volume><issue>2</issue><fpage>MR000013</fpage><pub-id pub-id-type="doi">10.1002/14651858.MR000013.pub6</pub-id><pub-id pub-id-type="medline">29468635</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>K&#x00F6;pcke</surname><given-names>F</given-names> </name><name name-style="western"><surname>Kraus</surname><given-names>S</given-names> </name><name name-style="western"><surname>Scholler</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Secondary use of routinely collected patient data in a clinical trial: an evaluation of the effects on patient recruitment and data acquisition</article-title><source>Int J Med Inform</source><year>2013</year><month>03</month><volume>82</volume><issue>3</issue><fpage>185</fpage><lpage>192</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://pubmed.ncbi.nlm.nih.gov/23266063/">https://pubmed.ncbi.nlm.nih.gov/23266063/</ext-link></comment><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2012.11.008</pub-id><pub-id pub-id-type="medline">23266063</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Batres</surname><given-names>C</given-names> </name><name name-style="western"><surname>Borda</surname><given-names>T</given-names> </name><etal/></person-group><article-title>A real-time screening alert improves patient recruitment efficiency</article-title><source>AMIA Annu Symp Proc</source><year>2011</year><volume>2011</volume><fpage>1489</fpage><lpage>1498</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://pubmed.ncbi.nlm.nih.gov/22195213/">https://pubmed.ncbi.nlm.nih.gov/22195213/</ext-link></comment><pub-id pub-id-type="medline">22195213</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ni</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wright</surname><given-names>J</given-names> </name><name name-style="western"><surname>Perentesis</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Increasing the efficiency of trial-patient matching: automated clinical trial eligibility pre-screening for pediatric oncology patients</article-title><source>BMC Med Inform Decis Mak</source><year>2015</year><month>04</month><day>14</day><volume>15</volume><fpage>28</fpage><pub-id pub-id-type="doi">10.1186/s12911-015-0149-3</pub-id><pub-id pub-id-type="medline">25881112</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Luo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Sohani</surname><given-names>AR</given-names> </name><name name-style="western"><surname>Hochberg</surname><given-names>EP</given-names> </name><name name-style="western"><surname>Szolovits</surname><given-names>P</given-names> </name></person-group><article-title>Automatic lymphoma classification with sentence subgraph mining from pathology reports</article-title><source>J Am Med Inform Assoc</source><year>2014</year><volume>21</volume><issue>5</issue><fpage>824</fpage><lpage>832</lpage><pub-id pub-id-type="doi">10.1136/amiajnl-2013-002443</pub-id><pub-id pub-id-type="medline">24431333</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>N&#x00E9;v&#x00E9;ol</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dalianis</surname><given-names>H</given-names> </name><name name-style="western"><surname>Velupillai</surname><given-names>S</given-names> </name><name name-style="western"><surname>Savova</surname><given-names>G</given-names> </name><name name-style="western"><surname>Zweigenbaum</surname><given-names>P</given-names> </name></person-group><article-title>Clinical natural language processing in languages other than English: opportunities and challenges</article-title><source>J Biomed Semantics</source><year>2018</year><month>03</month><day>30</day><volume>9</volume><issue>1</issue><fpage>12</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://pubmed.ncbi.nlm.nih.gov/29602312/">https://pubmed.ncbi.nlm.nih.gov/29602312/</ext-link></comment><pub-id pub-id-type="doi">10.1186/s13326-018-0179-8</pub-id><pub-id pub-id-type="medline">29602312</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kormilitzin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Vaci</surname><given-names>N</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Nevado-Holgado</surname><given-names>A</given-names> </name></person-group><article-title>Med7: A transferable clinical natural language processing model for electronic health records</article-title><source>Artif Intell Med</source><year>2021</year><month>08</month><volume>118</volume><fpage>102086</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://pubmed.ncbi.nlm.nih.gov/34412834/">https://pubmed.ncbi.nlm.nih.gov/34412834/</ext-link></comment><pub-id pub-id-type="doi">10.1016/j.artmed.2021.102086</pub-id><pub-id pub-id-type="medline">34412834</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yuan</surname><given-names>C</given-names> </name><name name-style="western"><surname>Ryan</surname><given-names>PB</given-names> </name><name name-style="western"><surname>Ta</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Criteria2Query: a natural language interface to clinical databases for cohort definition</article-title><source>J Am Med Inform Assoc</source><year>2019</year><month>04</month><day>1</day><volume>26</volume><issue>4</issue><fpage>294</fpage><lpage>305</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocy178</pub-id><pub-id pub-id-type="medline">30753493</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Devlin</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>MW</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>K</given-names> </name><name name-style="western"><surname>Toutanova</surname><given-names>K</given-names> </name></person-group><article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title><conf-name>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</conf-name><conf-date>Jun 2-7, 2019</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://aclanthology.org/N19-1423/">https://aclanthology.org/N19-1423/</ext-link></comment><pub-id pub-id-type="doi">10.18653/v1/N19-1423</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yoon</surname><given-names>W</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>S</given-names> </name><etal/></person-group><article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title><source>Bioinformatics</source><year>2020</year><month>02</month><day>15</day><volume>36</volume><issue>4</issue><fpage>1234</fpage><lpage>1240</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id><pub-id pub-id-type="medline">31501885</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Alsentzer</surname><given-names>E</given-names> </name><name name-style="western"><surname>Murphy</surname><given-names>J</given-names> </name><name name-style="western"><surname>Boag</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Publicly available clinical BERT embeddings</article-title><conf-name>Proceedings of the 2nd Clinical Natural Language Processing Workshop</conf-name><conf-date>Jun 7, 2019</conf-date><pub-id pub-id-type="doi">10.18653/v1/W19-1909</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Singhal</surname><given-names>K</given-names> </name><name name-style="western"><surname>Azizi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Tu</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Large language models encode clinical knowledge</article-title><source>Nature</source><year>2023</year><month>08</month><volume>620</volume><issue>7972</issue><fpage>172</fpage><lpage>180</lpage><pub-id pub-id-type="doi">10.1038/s41586-023-06291-2</pub-id><pub-id pub-id-type="medline">37438534</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kung</surname><given-names>TH</given-names> </name><name name-style="western"><surname>Cheatham</surname><given-names>M</given-names> </name><name name-style="western"><surname>Medenilla</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Performance of ChatGPT on USMLE: potential for AI-assisted medical education using large language models</article-title><source>PLOS Digit Health</source><year>2023</year><month>02</month><volume>2</volume><issue>2</issue><fpage>e0000198</fpage><pub-id pub-id-type="doi">10.1371/journal.pdig.0000198</pub-id><pub-id pub-id-type="medline">36812645</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Nori</surname><given-names>H</given-names> </name><name name-style="western"><surname>King</surname><given-names>N</given-names> </name><name name-style="western"><surname>McKinney</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Carignan</surname><given-names>D</given-names> </name><name name-style="western"><surname>Horvitz</surname><given-names>E</given-names> </name></person-group><article-title>Capabilities of GPT-4 on medical challenge problems</article-title><source>arXiv</source><comment>Preprint posted online on  Mar 20, 2023</comment><pub-id pub-id-type="doi">10.48550/arXiv.2303.13375</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tinn</surname><given-names>R</given-names> </name><name name-style="western"><surname>Cheng</surname><given-names>H</given-names> </name><name name-style="western"><surname>Gu</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Fine-tuning large neural language models for biomedical natural language processing</article-title><source>Patterns (N Y)</source><year>2023</year><month>04</month><day>14</day><volume>4</volume><issue>4</issue><fpage>100729</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://pubmed.ncbi.nlm.nih.gov/37123444/">https://pubmed.ncbi.nlm.nih.gov/37123444/</ext-link></comment><pub-id pub-id-type="doi">10.1016/j.patter.2023.100729</pub-id><pub-id pub-id-type="medline">37123444</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ayers</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Poliak</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dredze</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Comparing physician and artificial intelligence chatbot responses to patient questions posted to a public social media forum</article-title><source>JAMA Intern Med</source><year>2023</year><month>06</month><day>1</day><volume>183</volume><issue>6</issue><fpage>589</fpage><lpage>596</lpage><pub-id pub-id-type="doi">10.1001/jamainternmed.2023.1838</pub-id><pub-id pub-id-type="medline">37115527</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jin</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Floudas</surname><given-names>CS</given-names> </name><etal/></person-group><article-title>Matching patients to clinical trials with large language models</article-title><source>Nat Commun</source><year>2023</year><volume>15</volume><issue>1</issue><pub-id pub-id-type="doi">10.1038/s41467-024-53081-z</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Bolton</surname><given-names>E</given-names> </name><name name-style="western"><surname>Venigalla</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yasunaga</surname><given-names>M</given-names> </name></person-group><article-title>Biomedlm: a 2.7B parameter language model trained on biomedical text</article-title><source>arXiv</source><comment>Preprint posted online on  Mar 27, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2403.18421</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kang</surname><given-names>T</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Tang</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>EliIE: An open-source information extraction system for clinical trial eligibility criteria</article-title><source>J Am Med Inform Assoc</source><year>2017</year><month>11</month><day>1</day><volume>24</volume><issue>6</issue><fpage>1062</fpage><lpage>1071</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://pmc.ncbi.nlm.nih.gov/articles/PMC6259668/">https://pmc.ncbi.nlm.nih.gov/articles/PMC6259668/</ext-link></comment><pub-id pub-id-type="doi">10.1093/jamia/ocx019</pub-id><pub-id pub-id-type="medline">28379377</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Unger</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Hershman</surname><given-names>DL</given-names> </name><name name-style="western"><surname>Osarogiagbon</surname><given-names>RU</given-names> </name><etal/></person-group><article-title>Representativeness of Black patients in cancer clinical trials sponsored by the National Cancer Institute compared with pharmaceutical companies</article-title><source>JNCI Cancer Spectr</source><year>2020</year><month>08</month><volume>4</volume><issue>4</issue><fpage>pkaa034</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://academic.oup.com/jncics/article/4/4/pkaa034/5824796?guestAccessKey=">https://academic.oup.com/jncics/article/4/4/pkaa034/5824796?guestAccessKey=</ext-link></comment><pub-id pub-id-type="doi">10.1093/jncics/pkaa034</pub-id><pub-id pub-id-type="medline">32704619</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="web"><source>MedViz</source><access-date>2025-07-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://medviz.org/">https://medviz.org/</ext-link></comment></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kumar</surname><given-names>G</given-names> </name><name name-style="western"><surname>Chaudhary</surname><given-names>P</given-names> </name><name name-style="western"><surname>Quinn</surname><given-names>A</given-names> </name><name name-style="western"><surname>Su</surname><given-names>D</given-names> </name></person-group><article-title>Barriers for cancer clinical trial enrollment: a qualitative study of the perspectives of healthcare providers</article-title><source>Contemp Clin Trials Commun</source><year>2022</year><volume>28</volume><fpage>100939</fpage><pub-id pub-id-type="doi">10.1016/j.conctc.2022.100939</pub-id><pub-id pub-id-type="medline">35707483</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>ES</given-names> </name><name name-style="western"><surname>Uldrick</surname><given-names>TS</given-names> </name><name name-style="western"><surname>Schenkel</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Continuing to broaden eligibility criteria to make clinical trials more representative and inclusive: ASCO-friends of cancer research joint research statement</article-title><source>Clin Cancer Res</source><year>2021</year><month>05</month><day>1</day><volume>27</volume><issue>9</issue><fpage>2394</fpage><lpage>2399</lpage><pub-id pub-id-type="doi">10.1158/1078-0432.CCR-20-3852</pub-id><pub-id pub-id-type="medline">33563632</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yousafi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Rangachari</surname><given-names>P</given-names> </name><name name-style="western"><surname>Holland</surname><given-names>ML</given-names> </name></person-group><article-title>Barriers to recruitment and retention among underrepresented populations in cancer clinical trials: a qualitative study of the perspectives of clinical trial research coordinating staff at a cancer center</article-title><source>J Healthc Leadersh</source><year>2024</year><volume>16</volume><fpage>427</fpage><lpage>441</lpage><pub-id pub-id-type="doi">10.2147/JHL.S488426</pub-id><pub-id pub-id-type="medline">39502080</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="web"><article-title>YNHHS innovation awards</article-title><source>Yale New Haven Health</source><access-date>2026-05-01</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.ynhhs.org/about/innovation-initiatives/health-innovation/2024-Award-Winners/Clinical-Trial">https://www.ynhhs.org/about/innovation-initiatives/health-innovation/2024-Award-Winners/Clinical-Trial</ext-link></comment></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="web"><article-title>CtrlTrial criteria visualizer</article-title><source>GitHub</source><access-date>2026-05-01</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/ctrltrial/CriteriaVisualizer">https://github.com/ctrltrial/CriteriaVisualizer</ext-link></comment></nlm-citation></ref></ref-list></back></article>