<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Res Protoc</journal-id><journal-id journal-id-type="publisher-id">ResProt</journal-id><journal-id journal-id-type="index">5</journal-id><journal-title>JMIR Research Protocols</journal-title><abbrev-journal-title>JMIR Res Protoc</abbrev-journal-title><issn pub-type="epub">1929-0748</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v15i1e89279</article-id><article-id pub-id-type="doi">10.2196/89279</article-id><article-categories><subj-group subj-group-type="heading"><subject>Protocol</subject></subj-group></article-categories><title-group><article-title>An Explainable AI Framework for Continuous Monitoring, Risk Stratification, and Clinical Decision Support in Primary Biliary Cholangitis: Protocol for a Multiphase Development and Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Njei</surname><given-names>Basile</given-names></name><degrees>MPH, MD, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sidney Kanmounye</surname><given-names>Ulrick</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Engelhardt School of Global Health and Bioethics, Euclid University</institution><addr-line>Avenue de France, Campus ENAM</addr-line><addr-line>Bangui</addr-line><country>Central African Republic</country></aff><aff id="aff2"><institution>Association of Future African Neurosurgeons</institution><addr-line>Yaounde</addr-line><country>Cameroon</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Sarvestan</surname><given-names>Javad</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Sun</surname><given-names>Chunbao</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Basile Njei, MPH, MD, PhD, Engelhardt School of Global Health and Bioethics, Euclid University, Avenue de France, Campus ENAM, Bangui, BP 157, Central African Republic, +236 21 61 59 2; <email>basilenjei@gmail.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>24</day><month>6</month><year>2026</year></pub-date><volume>15</volume><elocation-id>e89279</elocation-id><history><date date-type="received"><day>09</day><month>12</month><year>2025</year></date><date date-type="rev-recd"><day>24</day><month>04</month><year>2026</year></date><date date-type="accepted"><day>27</day><month>04</month><year>2026</year></date></history><copyright-statement>&#x00A9; Basile Njei, Ulrick Sidney Kanmounye. Originally published in JMIR Research Protocols (<ext-link ext-link-type="uri" xlink:href="https://www.researchprotocols.org">https://www.researchprotocols.org</ext-link>), 24.6.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.researchprotocols.org">https://www.researchprotocols.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.researchprotocols.org/2026/1/e89279"/><abstract><sec><title>Background</title><p>Primary biliary cholangitis (PBC) management remains limited by reliance on static biochemical markers, fragmented assessment of symptom burden, and inadequate noninvasive risk stratification for clinically significant portal hypertension (CSPH). Existing tools fail to integrate longitudinal laboratory trends, elastography, and patient-reported outcomes, and translation of risk assessment into guideline-concordant clinical action remains inconsistent.</p></sec><sec><title>Objective</title><p>This study aims to develop, validate, and pilot an explainable artificial intelligence (AI) framework&#x2014;AIm-PBC&#x2014;for continuous disease monitoring, early prediction of CSPH complications, and delivery of guideline-based clinical decision support in patients with PBC.</p></sec><sec sec-type="methods"><title>Methods</title><p>We will conduct a multiphase study combining retrospective cohort analysis, prospective observational data collection, and implementation evaluation. At least 600 adults with confirmed PBC will be enrolled across academic hepatology centers. The AI framework will integrate longitudinal biochemical markers, noninvasive elastography metrics, and high-frequency patient-reported outcomes to generate an interpretable disease activity index and predict CSPH-related complications using gradient-boosted models with Shapley additive explanations. Outputs will be deployed via a SMART-on-FHIR (Substitutable Medical Applications, Reusable Technologies on Fast Healthcare Interoperability Resources)&#x2013;enabled electronic health record clinical decision support tool. Implementation will be evaluated using a randomized crossover simulation followed by a pragmatic pilot assessing usability, cognitive load, clinician adherence, and feasibility.</p></sec><sec sec-type="results"><title>Results</title><p>The primary outcomes include calibration and responsiveness of the disease activity index; discriminatory performance of the CSPH prediction model compared with established criteria; and effectiveness of the decision support tool measured via improvements in guideline-concordant care, usability scores, and clinician cognitive workload. Secondary outcomes include fairness metrics and workflow efficiency.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This protocol outlines a scalable, explainable AI framework designed to bridge gaps between disease monitoring, risk prediction, and clinical action in PBC. If successful, AIm-PBC may enhance early complication detection, improve symptom management, and support equitable, evidence-based care delivery in routine hepatology practice.</p></sec><sec sec-type="registered-report"><title>International Registered Report Identifier (IRRID)</title><p>PRR1-10.2196/89279</p></sec></abstract><kwd-group><kwd>artificial intelligence</kwd><kwd>AI</kwd><kwd>primary biliary cholangitis</kwd><kwd>randomized controlled trials</kwd><kwd>clinical decision support</kwd><kwd>portal hypertension</kwd><kwd>explainable artificial intelligence</kwd><kwd>patient-reported outcomes</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>Despite advances in primary biliary cholangitis (PBC) therapy, significant gaps persist in monitoring disease activity, predicting complications, and delivering guideline-concordant care [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. Current management strategies rely heavily on biochemical markers such as alkaline phosphatase (ALP) and bilirubin, which often fail to capture dynamic symptom fluctuations or early progression toward clinically significant portal hypertension (CSPH) [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. This limitation delays timely intervention and contributes to morbidity [<xref ref-type="bibr" rid="ref7">7</xref>].</p><p>Risk stratification for portal hypertension, a complication of PBC, remains particularly challenging [<xref ref-type="bibr" rid="ref8">8</xref>]. Invasive procedures such as endoscopy are frequently used for variceal screening, yet these approaches are resource intensive and carry procedural risks [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Noninvasive surrogates, including liver stiffness measurement (LSM) and spleen stiffness measurement (SSM), have demonstrated promise in predicting CSPH and reducing unnecessary endoscopies [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. However, these modalities are rarely integrated with longitudinal biochemical data or patient-reported outcomes (PROs), leaving clinicians without a comprehensive, real-time view of disease trajectory [<xref ref-type="bibr" rid="ref10">10</xref>]. Even when risk is identified, translating insights into action remains challenging. Clinicians face cognitive overload and workflow fragmentation, leading to missed opportunities for guideline-based interventions such as pruritus step therapy, bone health management, and CSPH screening [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>Symptom burden represents another critical dimension of PBC care. Validated instruments such as the Worst Itch Numeric Rating Scale (WI-NRS) and PBC-40 provide reliable measures of symptom severity [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Similarly to risk stratification tools, symptom burden tools are underused in routine practice and seldom incorporated into predictive models.</p></sec><sec id="s1-2"><title>Proposed Solution</title><p>Artificial intelligence (AI) offers an opportunity to address these gaps by integrating heterogeneous data streams, including biochemical markers, elastography metrics, and PROs, into dynamic, explainable models capable of continuous monitoring and risk prediction [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. By developing an agentic AI system that integrates longitudinal biochemical data, elastography metrics, and high-frequency PROs, we aim to provide clinicians with a dynamic, explainable disease activity index. This approach will enable proactive management of symptoms and early identification of nonresponders [<xref ref-type="bibr" rid="ref15">15</xref>], reducing morbidity and improving patient-centered outcomes. Our multi-signal predictive model will integrate elastography, platelet count, biochemical response, and comorbidity profiles to accurately identify patients at high risk of early CSPH complications. This composite approach promises to reduce unnecessary endoscopies while ensuring timely prophylaxis for those at greatest risk. By embedding explainable AI outputs into an electronic health record (EHR)&#x2013;integrated clinical decision support (CDS) tool, we aim to bridge the gap between prediction and practice. This prototype will feature interpretable risk cards and dual-threshold triage cues, ensuring usability and trust while promoting equity across diverse clinical settings. While machine learning algorithms have shown promise in chronic liver disease, most operate as &#x201C;black boxes,&#x201D; limiting clinician trust and adoption. Consequently, we aim to use Shapley additive explanations (SHAP) combined with dual-threshold triage strategies to enhance transparency and usability.</p></sec><sec id="s1-3"><title>Study Aim</title><p>This protocol describes a multiphase study designed to develop, validate, and pilot this explainable AI framework for PBC management. The proposed framework, named AIm-PBC system, will integrate longitudinal multi-signal data to (1) provide continuous, interpretable assessment of disease activity and symptom burden; (2) predict CSPH complications using a composite noninvasive model; and (3) operationalize guideline-concordant care through an EHR-integrated CDS prototype (<xref ref-type="fig" rid="figure1">Figure 1</xref>). By leveraging implementation science principles, this study aims to ensure feasibility, usability, and equity across diverse clinical environments.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Conceptual framework for the explainable artificial intelligence (AI) system for symptom and disease monitoring, early portal hypertension prediction, and remote clinical decision support (CDS) in primary biliary cholangitis (PBC). ALP: alkaline phosphatase; AQFIB-4: Fibrosis-4 index for liver fibrosis; CSPH: clinically significant portal hypertension; DO: doctor of osteopathic medicine; EHR: electronic health record; MD: doctor of medicine; NP: nurse practitioner; PA: physician assistant.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="resprot_v15i1e89279_fig01.png"/></fig></sec><sec id="s1-4"><title>Hypothesis</title><p>We hypothesize that this integrated, explainable AI approach will outperform conventional monitoring strategies, improve risk stratification for CSPH, and enhance clinician adherence to evidence-based care pathways, ultimately reducing symptom burden and preventing complications in patients with PBC.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>This multiphase study will combine retrospective cohort analysis, prospective observational data collection, and implementation science evaluation using a randomized crossover simulation followed by a pragmatic pilot. Its aims address critical unmet needs in PBC care by leveraging explainable AI to integrate multimodal data streams, predict complications, and operationalize evidence-based management. The study consists of 3 sequential phases: retrospective model development, prospective simulation testing, and real-world implementation. A summary of the objectives, data sources, participants, and outcomes for each phase is provided in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Overview of study phases, objectives, data sources, and outcomes.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Phase</td><td align="left" valign="bottom">Study type</td><td align="left" valign="bottom">Objective</td><td align="left" valign="bottom">Data sources</td><td align="left" valign="bottom">Participants</td><td align="left" valign="bottom">Primary outcomes</td></tr></thead><tbody><tr><td align="left" valign="top">Phase 1: model development and retrospective validation</td><td align="left" valign="top">Retrospective analysis</td><td align="left" valign="top">To develop and retrospectively validate the AI<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>-based predictive model for PBC<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup>-associated significant fibrosis using existing clinical datasets</td><td align="left" valign="top">Retrospective EHR<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup> datasets and previously collected clinical variables</td><td align="left" valign="top">Adult patients with MASLD and available fibrosis assessment data</td><td align="left" valign="top">Model discrimination and calibration for predicting significant fibrosis (eg, AUROC<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup>, sensitivity, and specificity)</td></tr><tr><td align="left" valign="top">Phase 2: prospective simulation and workflow testing</td><td align="left" valign="top">Prospective simulation</td><td align="left" valign="top">To evaluate how the AI system performs within simulated primary care workflows and refine decision thresholds and outputs</td><td align="left" valign="top">Prospective simulated clinical cases and structured datasets reflecting real-world patient characteristics</td><td align="left" valign="top">Simulated patient scenarios evaluated by clinicians using the AI decision support system</td><td align="left" valign="top">Diagnostic accuracy, workflow integration feasibility, and clinician usability metrics</td></tr><tr><td align="left" valign="top">Phase 3: real-world clinical implementation</td><td align="left" valign="top">Prospective real-world implementation</td><td align="left" valign="top">To assess the clinical performance and implementation feasibility of the AI decision support system in routine care</td><td align="left" valign="top">Real-world clinical data collected during system deployment in participating clinical settings</td><td align="left" valign="top">Adult patients undergoing evaluation for MASLD in real clinical practice</td><td align="left" valign="top">Detection rate of significant fibrosis, clinical decision impact, and implementation feasibility metrics</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>AI: artificial intelligence.</p></fn><fn id="table1fn2"><p><sup>b</sup>PBC: primary biliary cholangitis. </p></fn><fn id="table1fn3"><p><sup>c</sup>EHR: electronic health record.</p></fn><fn id="table1fn4"><p><sup>d</sup>AUROC: area under the receiver operating characteristic curve.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-2"><title>Study Setting</title><p>The study will be conducted across multiple hepatology clinics affiliated with academic medical centers in the United States. The CDS pilot will be implemented within EHR environments supporting SMART-on-FHIR (Substitutable Medical Applications, Reusable Technologies on Fast Healthcare Interoperability Resources) integration.</p></sec><sec id="s2-3"><title>Eligibility Criteria</title><p>Adults aged 18 years or older with a confirmed diagnosis of PBC according to American Association for the Study of Liver Diseases criteria (ie, defined as elevated ALP of &#x2265;1.5 times the upper limit of normal in combination with a positive antimitochondrial antibody or disease-specific antinuclear antibodies such as sp100 or gp210) [<xref ref-type="bibr" rid="ref2">2</xref>]. For individuals who are seronegative, histological confirmation through liver biopsy will be mandatory. All participants must have been receiving standard therapeutic dosing of ursodeoxycholic acid for a minimum of 3 months prior to enrollment, defined as 13 to 15 mg per kilogram of body weight per day administered in 2 or 3 divided doses [<xref ref-type="bibr" rid="ref2">2</xref>]. Patients who are on second-line therapies, including farnesoid X receptor agonists or peroxisome proliferator&#x2013;activated receptor agonists, will also be eligible, and therapy class will be recorded as a covariate. Additionally, baseline elastography data, including LSM and SSM, must be available within 6 months of enrollment.</p><p>Individuals will be excluded if they have previously undergone liver transplantation or are currently listed for transplantation or if they present with decompensated cirrhosis at baseline, defined as Child-Pugh class B or C [<xref ref-type="bibr" rid="ref16">16</xref>]. Other exclusion criteria include active malignancy, uncontrolled systemic illness, pregnancy, or inability to provide informed consent. Patients with significant alcohol consumption within 6 months of enrollment (ie, more than 20 grams per day for female individuals or more than 30 grams per day for male individuals or an Alcohol Use Disorders Identification Test&#x2013;Consumption score of 4 or higher) [<xref ref-type="bibr" rid="ref17">17</xref>] will not be eligible. Additional exclusions are coexisting chronic liver diseases such as chronic viral hepatitis, hemochromatosis, Wilson disease, or alpha-1 antitrypsin deficiency, as well as active or suspected drug-induced liver injury within the prior 6 months, including drug-induced autoimmune hepatitis (AIH). Any condition deemed by the investigators to compromise participant safety or data integrity will also result in exclusion. A summary of inclusion and exclusion criteria is provided in <xref ref-type="other" rid="box1">Textbox 1</xref>.</p><p>To enable subgroup analyses, participants will be stratified by the presence of AIH overlap, defined using the Paris criteria [<xref ref-type="bibr" rid="ref18">18</xref>], and by the presence of metabolic dysfunction&#x2013;associated steatohepatitis (MASH), identified through structured chart abstraction and imaging or laboratory features [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. Stratification will also occur based on biochemical response status at 12 months following initiation of ursodeoxycholic acid therapy, categorized using established UK-PBC and GLOBE risk scores [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>].</p><boxed-text id="box1"><title> Inclusion and exclusion criteria.</title><p><bold>Inclusion criteria</bold></p><list list-type="bullet"><list-item><p>Adults aged &#x2265;18 y</p></list-item><list-item><p>Confirmed diagnosis of primary biliary cholangitis according to American Association for the Study of Liver Diseases criteria, defined as elevated alkaline phosphatase of &#x2265;1.5 times the upper limit of normal with positive antimitochondrial antibody or disease-specific antinuclear antibodies such as sp100 or gp210 [<xref ref-type="bibr" rid="ref2">2</xref>]</p></list-item><list-item><p>For seronegative individuals, histological confirmation via liver biopsy</p></list-item><list-item><p>Receiving standard therapeutic dosing of ursodeoxycholic acid for &#x2265;3 mo before enrollment, defined as 13 to 15 mg per kilogram per day in 2 or 3 divided doses [<xref ref-type="bibr" rid="ref2">2</xref>]</p></list-item><list-item><p>Patients receiving second-line therapies, including farnesoid X receptor agonists or peroxisome proliferator&#x2013;activated receptor agonists, with therapy class recorded as a covariate</p></list-item><list-item><p>Baseline elastography data, including liver stiffness measurement and spleen stiffness measurement, available within 6 mo of enrollment</p></list-item></list><p><bold>Exclusion criteria</bold></p><list list-type="bullet"><list-item><p>Prior liver transplantation or currently listed for liver transplantation</p></list-item><list-item><p>Decompensated cirrhosis at baseline, defined as Child-Pugh class B or C [<xref ref-type="bibr" rid="ref16">16</xref>]</p></list-item><list-item><p>Active malignancy, uncontrolled systemic illness, pregnancy, or inability to provide informed consent</p></list-item><list-item><p>Significant alcohol consumption within 6 mo of enrollment, defined as &#x003E;20 g per day for female individuals or &#x003E;30 g per day for male individuals or Alcohol Use Disorders Identification Test&#x2013;Consumption score of &#x2265;4 [<xref ref-type="bibr" rid="ref17">17</xref>]</p></list-item><list-item><p>Coexisting chronic liver diseases, including chronic viral hepatitis, hemochromatosis, Wilson disease, or alpha-1 antitrypsin deficiency</p></list-item><list-item><p>Active or suspected drug-induced liver injury within the prior 6 mo, including drug-induced autoimmune hepatitis</p></list-item><list-item><p>Any condition deemed by the investigators to compromise participant safety or data integrity</p></list-item></list></boxed-text></sec><sec id="s2-4"><title>Interventions</title><p>The intervention consists of the development and deployment of the AIm-PBC framework across 3 sequential phases. The first phase focuses on building an agentic AI system capable of continuous monitoring of disease activity and symptom burden. This system will integrate multiple data streams, including monthly biochemical markers, periodic elastography measurements such as LSM and SSM, and high-frequency PROs collected through validated instruments such as the WI-NRS and the PBC-40. The agent will autonomously orchestrate data ingestion, normalization, and analysis to generate an explainable disease activity index supported by SHAP-based visualizations to ensure interpretability for clinicians.</p><p>The second phase involves the creation and validation of a multi-signal predictive model for early identification of portal hypertension complications. This model will combine elastography metrics, platelet count, biochemical response trajectories, and comorbidity profiles, including AIH and MASH overlap. By leveraging gradient-boosted ensemble algorithms and explainability frameworks, the model aims to outperform existing single-modality rules and consensus criteria such as Baveno VII [<xref ref-type="bibr" rid="ref24">24</xref>], providing a noninvasive, accurate method for triaging endoscopy referrals and initiating prophylactic interventions.</p><p>The third phase operationalizes these insights through an EHR-integrated CDS prototype. Built within a SMART-on-FHIR architecture, the CDS tool will present clinicians with interpretable risk cards; dual-threshold triage cues; and guideline-based order sets for interventions such as pruritus step therapy, bone health management, and endoscopy referral. This phase includes a randomized crossover simulation to evaluate usability, decision accuracy, and cognitive load, followed by a pragmatic pilot in hepatology clinics to assess feasibility and effectiveness in real-world workflows. Collectively, these interventions aim to transform PBC care by embedding explainable AI into routine practice, improving monitoring, risk prediction, and adherence to evidence-based management strategies.</p></sec><sec id="s2-5"><title>Outcomes</title><p>The primary outcome for the first aim will be the performance of the AIm-PBC disease activity index compared to conventional monitoring strategies. This will be assessed through its calibration against established risk scores such as UK-PBC and GLOBE [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>], as well as its responsiveness to clinically meaningful changes in disease activity. The ability of the integrated symptom indexes to correlate with biochemical progression or regression will also be evaluated, providing insights into whether the inclusion of PROs enhances the sensitivity of disease monitoring. Explainability will be measured via the interpretability of SHAP-based visualizations and their perceived clinical utility during clinician evaluations.</p><p>For the second aim, the primary outcome will be the discriminatory ability of the multi-signal predictive model to identify patients at high risk of CSPH and early complications such as variceal hemorrhage or ascites. This will be quantified using the area under the receiver operating characteristic curve (AUROC), with additional measures of calibration and clinical utility assessed through decision curve analysis and net reclassification improvement. Comparative analyses will determine whether the composite model outperforms single-modality rules and consensus criteria such as Baveno VII, and subgroup analyses will explore performance consistency across patients with AIH overlap and MASH.</p><p>For the third aim, the primary outcome will be the effectiveness and usability of the EHR-integrated CDS prototype. Effectiveness will be measured via improvements in clinician adherence to guideline-concordant care pathways, including pruritus management, bone health interventions, and risk-based endoscopy referrals. Usability will be assessed using the System Usability Scale, with a target score of 70 or higher, and cognitive load will be evaluated using the NASA-Task Load Index. Clinician trust in the AI system will be measured through the AI trust scale, whereas decision accuracy and decision time will be compared between CDS-assisted and usual care conditions during the randomized crossover simulation. Feasibility indicators, including recruitment and completion rates, will be monitored during the pragmatic pilot phase.</p><p>Secondary outcomes will include fairness metrics to ensure equitable model performance across demographic and clinical subgroups, defined as an AUROC parity gap of no more than 5%. Additional exploratory outcomes will examine the impact of the intervention on workflow efficiency and clinician confidence in decision-making.</p></sec><sec id="s2-6"><title>Harms</title><p>This pilot implementation component is considered minimal risk for multiple reasons. First, the randomized crossover simulation will involve standardized simulated or deidentified patient cases rather than live clinical encounters. The participants in this simulation component will be health care providers who interact with an EHR interface in a controlled environment. The decision support tool will provide risk estimates and triage recommendations based on synthetic or deidentified data. As such, the simulation component is not expected to pose physical harm, diagnostic error affecting patient care, or adverse clinical outcomes. For the observational/model-development components, adults with PBC will contribute clinical, elastography, and patient-reported outcome data under institutional review board&#x2013;approved procedures and standard privacy protections.</p></sec><sec id="s2-7"><title>Participant Timeline</title><p>Participants will enter the study and begin with baseline assessments, which include collection of demographic information, medical history, and initial laboratory values, as well as elastography measurements for liver and spleen stiffness. At this visit, participants will also be enrolled in the PRO system, with instructions for completing the WI-NRS and the PBC-40 questionnaires. These assessments will continue throughout the observation period to capture longitudinal symptom trajectories. The schedule of enrollment, interventions, and assessments is provided in <xref ref-type="supplementary-material" rid="app5">Checklist 1</xref>.</p><p>Biochemical data will be collected at monthly intervals for the duration of the study, ensuring high-resolution monitoring of disease activity. Elastography will be repeated at predefined intervals, typically every 6 to 12 months or as clinically indicated, to track changes in liver and spleen stiffness over time. Clinical outcomes such as the development of varices, ascites, or hepatic encephalopathy will be monitored continuously through routine clinical care and documented in the study database.</p><p>For participants involved in the implementation phase, the timeline includes a randomized crossover simulation in which clinicians will manage deidentified cases under 2 conditions: usual care and CDS-assisted care. This simulation will occur after the development and validation phases are complete. Following the simulation, a pragmatic pilot will be conducted in real-world hepatology clinics, where the CDS tool will be integrated into the EHR and used during routine visits. Clinician usability and trust assessments will be administered at the end of each simulation period and again after the pilot phase.</p><p>The overall duration of participation for patients in the observational component is expected to be up to 24 months. Clinicians participating in the implementation evaluation will engage in shorter, structured sessions for simulation and a limited rollout period for the pilot.</p></sec><sec id="s2-8"><title>Sample Size and Power Considerations</title><p>Because this protocol involves model development, validation, and implementation feasibility, the planned sample size was based on expected cohort availability and anticipated outcome events rather than a conventional hypothesis-testing formula. The sample size determination for this study is primarily driven by the second aim, which focuses on validating the predictive model for CSPH. On the basis of preliminary data and published estimates, we anticipate enrolling approximately 600 patients with PBC across participating sites [<xref ref-type="bibr" rid="ref7">7</xref>]. This cohort size reflects the expected availability of retrospective and prospective data within the study time frame and ensures adequate representation of key subgroups, including patients with AIH overlap and MASH [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>].</p><p>On the basis of prior PBC cohorts, the prevalence of portal hypertension or CSPH in hepatology referral populations has been reported to range from approximately 24% to 47% depending on disease stage and case mix [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. With a projected sample of 600 participants, this corresponds to an estimated 144 to 282 CSPH events, which provides a sufficient number of outcome events to support model development and validation and evaluate improvements in model discrimination relative to established criteria such as Baveno VII.</p><p>In addition, sample size considerations accounted for model complexity. Current methodological guidance for prediction modeling recommends ensuring an adequate number of outcome events relative to the number of predictor parameters to reduce the risk of model overfitting. The anticipated event counts in this cohort are expected to support the planned set of candidate predictors while maintaining an appropriate events-per-predictor ratio for stable model estimation [<xref ref-type="bibr" rid="ref27">27</xref>].</p></sec><sec id="s2-9"><title>Recruitment</title><p>Approximately 24 hepatology clinicians will be recruited for the clinician-level randomized crossover simulation. This sample size was selected pragmatically to provide sufficient clinician-level feedback on usability, cognitive workload, trust, and workflow integration while remaining feasible for a pilot implementation study. Eligible clinicians will include hepatologists, advanced practice clinicians, and hepatology trainees with clinical experience managing patients with PBC. Participants will be recruited from hepatology clinics affiliated with academic medical centers.</p></sec><sec id="s2-10"><title>Randomization</title><p>Randomization will apply only to the implementation phase of the study during the clinician-level crossover simulation. Clinicians will be randomly assigned in a 1:1 ratio to 1 of 2 sequences: usual care followed by CDS-assisted care or CDS-assisted care followed by usual care. A computer-generated randomization schedule will be used to balance allocation between sequences and minimize allocation bias. The simulation will use standardized, deidentified cases rather than live clinical encounters.</p><p>To minimize learning and carryover effects, the 2 simulation periods will use distinct, nonoverlapping standardized cases matched in clinical complexity. A 1-week washout period will separate the 2 conditions, and case order will be varied within each period where feasible. Primary comparisons will be conducted within clinicians, allowing each participant to serve as their own control (<xref ref-type="fig" rid="figure2">Figure 2</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>AIm-PBC clinician-level crossover randomized controlled trial pilot design. EHR: electronic health record; FTE: full-time equivalent. DO: doctor of osteopathic medicine; MD: doctor of medicine; NP: nurse practitioner; PA: physician assistant.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="resprot_v15i1e89279_fig02.png"/></fig></sec><sec id="s2-11"><title>Data Collection</title><p>Retrospective data will be sourced from institutional EHRs and data warehouses, capturing historical laboratory values, elastography reports, and clinical outcomes relevant to PBC. Prospective data collection will be conducted in outpatient hepatology clinics using secure, HIPAA (Health Insurance Portability and Accountability Act)-compliant platforms such as REDCap for PROs. These outcomes will include validated instruments such as the WI-NRS, administered twice daily to capture circadian variation in pruritus, and the PBC-40 questionnaire, administered monthly to assess quality of life domains.</p><p>Biochemical data, including ALP, bilirubin, aminotransferases, albumin, and platelet count, will be collected at monthly intervals to provide high-resolution longitudinal trajectories. LSM and SSM values will be obtained at baseline and during scheduled follow-up visits, with probe frequency and stiffness values recorded in kilopascals to ensure standardization. Clinical outcomes such as time to variceal development, ascites, and hepatic encephalopathy will be tracked over a 24-month observation period.</p><p>All data will be deidentified prior to analysis and stored in secure environments that comply with institutional and federal privacy regulations. Quality control procedures will include automated range checks for laboratory values, standardized reporting templates for elastography, and audit trails for PRO completion. Missing data will be addressed using multiple imputation techniques to minimize bias and preserve statistical power. Data integration will occur through structured pipelines that normalize heterogeneous inputs for use in machine learning models, ensuring consistency across biochemical, imaging, and symptom domains.</p></sec><sec id="s2-12"><title>AI Model Development and Validation</title><p>The predictive model will be developed using a prespecified machine learning pipeline. Candidate predictors will include longitudinal biochemical markers, platelet count, LSM, SSM, symptom scores, treatment response status, and relevant comorbidities. Features will be selected based on clinical relevance, data availability, and model stability, with highly collinear or sparsely available variables excluded or combined where appropriate.</p><p>The dataset will be divided into training, internal validation, and held-out testing subsets at the patient level to avoid data leakage. Model development will use gradient-boosted ensemble algorithms, with hyperparameters tuned within the training set using cross-validation. External validation will be performed using data from at least one participating site not used during model training where feasible.</p><p>Class imbalance will be addressed using strategies applied only within the training data, including class weighting or resampling approaches as appropriate. SHAP values will be generated to provide both patient- and cohort-level feature contributions. Model updating will not be performed during initial validation; if performance drift or poor calibration is observed during prospective deployment, recalibration or updating will be conducted using prespecified procedures and reported transparently.</p></sec><sec id="s2-13"><title>Statistical Analysis</title><p>For the first aim, longitudinal PROs and biochemical markers will be analyzed using mixed-effects models to account for within-subject correlation and repeated measures over time. These models will assess the responsiveness of integrated symptom indexes to changes in biochemical progression or regression, whereas calibration of the AIm-PBC disease activity index will be evaluated against established risk scores such as UK-PBC and GLOBE using the calibration slope, intercept, and Brier score. Discrimination will be quantified through the AUROC, and visualizations of SHAP values will be examined to confirm clinical interpretability.</p><p>For the second aim, the predictive model for CSPH complications will be developed using gradient-boosted ensemble algorithms chosen for their robustness in handling heterogeneous data. Model performance will be assessed through the AUROC for discrimination and calibration plots for agreement between predicted and observed outcomes. Clinical utility will be evaluated using decision curve analysis and net reclassification improvement to determine whether the composite model offers meaningful improvement over existing criteria. Comparative analyses will use DeLong tests to assess differences in AUROC between models, and subgroup analyses will be conducted to evaluate fairness and consistency across patients with AIH overlap and MASH. Ablation studies will quantify the incremental value of individual predictors, particularly SSM, by systematically removing variables and observing changes in performance.</p><p>For the third aim, implementation outcomes will be analyzed using both descriptive and inferential methods. Usability scores from the System Usability Scale (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), clinician trust scores from the AI trust scale adapted for AIm-PBC (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>), and cognitive load measures from the National Aeronautics and Space Administration Task Load Index (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>) will be summarized and compared between CDS-assisted and usual care conditions. Decision accuracy and decision time will be analyzed using 2-tailed paired <italic>t</italic> tests within the randomized crossover simulation, whereas clinician adherence to guideline-concordant care pathways will be evaluated using within-clinician comparisons across study phases. Feasibility indicators, such as recruitment and completion rates, will be reported as proportions with CIs. Qualitative debriefing interviews will be analyzed to explore clinician perceptions of usability, workflow integration, trust, and barriers to implementation (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). Fairness metrics, including AUROC parity gaps across demographic and clinical subgroups, will be calculated to ensure equitable performance of the CDS tool.</p><p>All analyses will be conducted using validated statistical software packages in R (R Foundation for Statistical Computing) and Python (Python Software Foundation), with significance thresholds set at a 2-sided &#x03B1; value of .05. Missing data will be addressed through multiple imputation techniques, and sensitivity analyses will be performed to confirm the robustness of the findings.</p></sec><sec id="s2-14"><title>Ethical Considerations</title><p>Ethics approval for this study will be obtained from the Yale University Human Research Protection Program prior to initiation. The protocol will be registered on ClinicalTrials.gov, and the registration record will be maintained and updated throughout the study to reflect any amendments or changes in status. The approved protocol version number and date will be displayed on all study documents, including the analysis plan, and any site-specific requirements mandated by participating clinics will be honored to ensure compliance with local governance standards.</p><p>This study will be conducted across multiple academic centers under a coordinated governance framework. Each participating site will obtain local institutional review board approval or reliance agreements as appropriate. Data sharing arrangements will be governed by formal data use agreements between institutions, ensuring compliance with HIPAA and applicable federal and institutional privacy regulations. All shared datasets will be deidentified prior to transfer and stored in secure, access-controlled environments. All participants will provide written informed consent prior to participation.</p><p>A central study steering committee comprising investigators with expertise in hepatology, data science, and implementation science will oversee study conduct, protocol adherence, and data integrity. Algorithm development and validation will be conducted within secure computing environments with version control and audit trails.</p><p>During the implementation phase, oversight of the CDS tool will include monitoring for safety, usability, and unintended consequences. Because the CDS tool is intended to support, not replace, clinician decision-making, final clinical decisions will remain at the discretion of the treating clinician. Any unexpected system behavior, performance concerns, or workflow disruptions identified during simulation or pilot deployment will be documented and reviewed by the study team, with predefined procedures for modification or suspension of the tool if necessary.</p><p>Any protocol amendments that materially affect eligibility criteria, study outcomes, data collection procedures, statistical analysis methods, consent language, or confidentiality protections will be submitted to the institutional review board for review and approval before implementation. The study team will maintain a comprehensive version history documenting the rationale for each change, along with dates and approvals. When amendments alter information that participants relied upon to provide informed consent, the research team will reconsent all active participants using revised documents. Substantive amendments will also be reflected in the ClinicalTrials.gov record and communicated to site leaders and stakeholders involved in recruitment and oversight.</p><p>This protocol has been developed in accordance with the SPIRIT (Standard Protocol Items: Recommendations for Interventional Trials) guidelines (<xref ref-type="supplementary-material" rid="app5">Checklist 1</xref>) [<xref ref-type="bibr" rid="ref28">28</xref>]. A SPIRIT figure outlining the schedule of enrollment, interventions, and assessments is available in <xref ref-type="supplementary-material" rid="app5">Checklist 1</xref>. Upon completion, study findings will be disseminated through peer-reviewed publications, presentations at national and international conferences, and summaries shared with participating sites. The final dataset, stripped of identifiers, will be made available through controlled-access repositories under appropriate data sharing agreements to promote reproducibility and secondary analyses. Results will be reported regardless of outcome, and any deviations from the original protocol will be clearly documented and justified in the final manuscript. Additionally, the ClinicalTrials.gov record will be updated with summary results in compliance with federal requirements.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>At the time of manuscript submission, this protocol had not yet begun participant recruitment or data analysis. No participants had been recruited. The study did not receive external funding; therefore, no funding date is applicable. Data collection is projected to begin after institutional review board approval and ClinicalTrials.gov registration, with retrospective data extraction and prospective observational data collection expected to occur over approximately 24 months. The clinician-level randomized crossover simulation and pragmatic pilot implementation phases are expected to occur after model development and validation are completed. Data analysis will begin after completion of the relevant data collection phases. The main study findings are expected to be submitted for publication in summer 2029.</p><p>The integrated disease activity index is expected to show strong calibration with established prognostic scores and greater responsiveness to clinically meaningful changes, whereas the inclusion of PROs will provide a more comprehensive view of symptom burden. The predictive model is expected to achieve an AUROC of at least 0.85 for identifying CSPH and deliver a net reclassification improvement of 10% or more over Baveno VII criteria, reducing unnecessary endoscopies without compromising safety. Finally, the CDS prototype is expected to improve clinician adherence to guideline-concordant care pathways, reduce decision time, and achieve high usability and trust scores during the simulation and pilot phases.</p></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Results</title><p>This protocol describes a multiphase study aimed at improving the management of PBC through an explainable AI framework. The anticipated results include a dynamic disease activity index that integrates biochemical, elastography, and patient-reported data, offering superior responsiveness and calibration compared to conventional monitoring. The predictive model is expected to achieve high discrimination for CSPH and outperform existing criteria, reducing unnecessary endoscopies while maintaining patient safety. Finally, the CDS prototype is designed to enhance clinician adherence to guideline-based care, improve decision accuracy, and reduce cognitive load, with usability and trust scores meeting or exceeding established benchmarks.</p></sec><sec id="s4-2"><title>Limitations</title><p>Several limitations must be acknowledged. The study relies on data from hepatology clinics affiliated with academic centers, which may limit generalizability to community settings. The observational component depends on accurate and complete longitudinal data, and missing data could introduce bias despite planned imputation strategies. Additionally, the implementation phase uses simulated cases before real-world deployment, which may not fully capture the complexity of clinical workflows. Finally, while explainability frameworks are incorporated, clinician adoption of AI tools may still be influenced by factors beyond technical performance, such as institutional culture and resource constraints.</p></sec><sec id="s4-3"><title>Comparison With Prior Work</title><p>Previous efforts in PBC management have focused primarily on biochemical monitoring and static risk scores such as UK-PBC and GLOBE, which do not account for dynamic symptom burden or integrate noninvasive imaging markers. Similarly, consensus criteria provide useful surrogates for portal hypertension but lack individualized predictive capability. Machine learning models have shown promise in chronic liver disease, yet most operate as opaque systems, limiting clinician trust and adoption. This study builds on these foundations by introducing an explainable, multi-signal approach that combines objective and patient-reported data, integrates noninvasive imaging, and operationalizes insights through EHR-based decision support.</p></sec><sec id="s4-4"><title>Conclusions</title><p>If successful, this study will demonstrate the feasibility and clinical utility of an explainable AI framework for PBC care, offering a scalable model for precision hepatology. By improving monitoring, risk prediction, and adherence to evidence-based management, the AIm-PBC system has the potential to reduce symptom burden, prevent complications, and enhance quality of life for patients. Future research will focus on external validation across diverse populations and health systems, as well as exploring integration with emerging biomarkers and digital health technologies to further refine predictive accuracy and patient engagement.</p></sec></sec></body><back><ack><p>The authors used ChatGPT by OpenAI [<xref ref-type="bibr" rid="ref29">29</xref>] solely to assist with language editing and improving the clarity of portions of the manuscript. No generative artificial intelligence tools were used to generate scientific content, perform analyses, interpret results, or develop the study design. All scientific concepts, methodology, and conclusions were developed by the authors, who take full responsibility for the content of the manuscript.</p><p>All authors declared that they had insufficient or no funding to support open access publication of this manuscript, including from affiliated organizations or institutions, funding agencies, or other organizations. JMIR Publications provided article processing fee support for the publication of this article.</p></ack><notes><sec><title>Funding</title><p>The authors received no financial support for the research, authorship, and/or publication of this article.</p></sec><sec><title>Data Availability</title><p>Data sharing is not applicable to this article as no datasets were generated or analyzed during this protocol.</p></sec></notes><fn-group><fn fn-type="con"><p>BN and USK conceived the study and designed the research protocol. BN led the development of the conceptual framework and methodological approach. USK contributed to study design refinement and implementation strategy. Both authors contributed to drafting the manuscript, critically revised it for intellectual content, and approved the final version.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">AIH</term><def><p>autoimmune hepatitis</p></def></def-item><def-item><term id="abb3">ALP</term><def><p>alkaline phosphatase</p></def></def-item><def-item><term id="abb4">AUROC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item><def-item><term id="abb5">CDS</term><def><p>clinical decision support</p></def></def-item><def-item><term id="abb6">CSPH </term><def><p>clinically significant portal hypertension</p></def></def-item><def-item><term id="abb7">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb8">HIPAA </term><def><p>Health Insurance Portability and Accountability Act</p></def></def-item><def-item><term id="abb9">LSM</term><def><p>liver stiffness measurement</p></def></def-item><def-item><term id="abb10">MASH</term><def><p>metabolic dysfunction&#x2013;associated steatohepatitis</p></def></def-item><def-item><term id="abb11">PBC</term><def><p>primary biliary cholangitis</p></def></def-item><def-item><term id="abb12">PRO</term><def><p>patient-reported outcome</p></def></def-item><def-item><term id="abb13">REDCap</term><def><p>Research Electronic Data Capture</p></def></def-item><def-item><term id="abb14">SHAP</term><def><p>Shapley additive explanations</p></def></def-item><def-item><term id="abb15">SMART-on-FIHR</term><def><p>Substitutable Medical Applications, Reusable Technologies on Fast Healthcare Interoperability Resources</p></def></def-item><def-item><term id="abb16">SPIRIT</term><def><p>Standard Protocol Items: Recommendations for Interventional Trials</p></def></def-item><def-item><term id="abb17">SSM</term><def><p>spleen stiffness measurement</p></def></def-item><def-item><term id="abb18">WI-NRS</term><def><p>Worst Itch Numeric Rating Scale</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Levy</surname><given-names>C</given-names> </name><name name-style="western"><surname>Manns</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hirschfield</surname><given-names>G</given-names> </name></person-group><article-title>New treatment paradigms in primary biliary cholangitis</article-title><source>Clin Gastroenterol Hepatol</source><year>2023</year><month>07</month><volume>21</volume><issue>8</issue><fpage>2076</fpage><lpage>2087</lpage><pub-id pub-id-type="doi">10.1016/j.cgh.2023.02.005</pub-id><pub-id pub-id-type="medline">36809835</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lindor</surname><given-names>KD</given-names> </name><name name-style="western"><surname>Bowlus</surname><given-names>CL</given-names> </name><name name-style="western"><surname>Boyer</surname><given-names>J</given-names> </name><name name-style="western"><surname>Levy</surname><given-names>C</given-names> </name><name name-style="western"><surname>Mayo</surname><given-names>M</given-names> </name></person-group><article-title>Primary biliary cholangitis: 2018 practice guidance from the American Association for the Study of Liver Diseases</article-title><source>Hepatology</source><year>2019</year><month>01</month><volume>69</volume><issue>1</issue><fpage>394</fpage><lpage>419</lpage><pub-id pub-id-type="doi">10.1002/hep.30145</pub-id><pub-id pub-id-type="medline">30070375</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alvaro</surname><given-names>D</given-names> </name><name name-style="western"><surname>Calvaruso</surname><given-names>V</given-names> </name><name name-style="western"><surname>Carbone</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Quality measures to enhance the management and treatment of primary biliary cholangitis: a Delphi consensus study</article-title><source>Liver Int</source><year>2025</year><month>06</month><volume>45</volume><issue>6</issue><fpage>e70118</fpage><pub-id pub-id-type="doi">10.1111/liv.70118</pub-id><pub-id pub-id-type="medline">40318123</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>European Association for the Study of the Liver</collab></person-group><article-title>EASL Clinical Practice Guidelines: the diagnosis and management of patients with primary biliary cholangitis</article-title><source>J Hepatol</source><year>2017</year><month>07</month><volume>67</volume><issue>1</issue><fpage>145</fpage><lpage>172</lpage><pub-id pub-id-type="doi">10.1016/j.jhep.2017.03.022</pub-id><pub-id pub-id-type="medline">28427765</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Barba Bernal</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ferrigno</surname><given-names>B</given-names> </name><name name-style="western"><surname>Medina Morales</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Management of primary biliary cholangitis: current treatment and future perspectives</article-title><source>Turk J Gastroenterol</source><year>2023</year><month>02</month><volume>34</volume><issue>2</issue><fpage>89</fpage><lpage>100</lpage><pub-id pub-id-type="doi">10.5152/tjg.2023.22239</pub-id><pub-id pub-id-type="medline">36843300</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Momah</surname><given-names>N</given-names> </name><name name-style="western"><surname>Silveira</surname><given-names>MG</given-names> </name><name name-style="western"><surname>Jorgensen</surname><given-names>R</given-names> </name><name name-style="western"><surname>Sinakos</surname><given-names>E</given-names> </name><name name-style="western"><surname>Lindor</surname><given-names>KD</given-names> </name></person-group><article-title>Optimizing biochemical markers as endpoints for clinical trials in primary biliary cirrhosis</article-title><source>Liver Int</source><year>2012</year><month>05</month><volume>32</volume><issue>5</issue><fpage>790</fpage><lpage>795</lpage><pub-id pub-id-type="doi">10.1111/j.1478-3231.2011.02678.x</pub-id><pub-id pub-id-type="medline">22136310</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Trivella</surname><given-names>J</given-names> </name><name name-style="western"><surname>John</surname><given-names>BV</given-names> </name><name name-style="western"><surname>Levy</surname><given-names>C</given-names> </name></person-group><article-title>Primary biliary cholangitis: epidemiology, prognosis, and treatment</article-title><source>Hepatol Commun</source><year>2023</year><month>06</month><day>1</day><volume>7</volume><issue>6</issue><fpage>e0179</fpage><pub-id pub-id-type="doi">10.1097/HC9.0000000000000179</pub-id><pub-id pub-id-type="medline">37267215</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Martini</surname><given-names>F</given-names> </name><name name-style="western"><surname>Balducci</surname><given-names>D</given-names> </name><name name-style="western"><surname>Mancinelli</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Risk stratification in primary biliary cholangitis</article-title><source>J Clin Med</source><year>2023</year><month>09</month><day>1</day><volume>12</volume><issue>17</issue><fpage>5713</fpage><pub-id pub-id-type="doi">10.3390/jcm12175713</pub-id><pub-id pub-id-type="medline">37685780</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Rui</surname><given-names>F</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>C</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name></person-group><article-title>Spleen stiffness measurement as a non-invasive assessment in patients with portal hypertension</article-title><source>eGastroenterology</source><year>2024</year><month>02</month><volume>2</volume><issue>1</issue><fpage>e100031</fpage><pub-id pub-id-type="doi">10.1136/egastro-2023-100031</pub-id><pub-id pub-id-type="medline">39944747</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>HP</given-names> </name><name name-style="western"><surname>Lieber</surname><given-names>SR</given-names> </name><name name-style="western"><surname>Rogers</surname><given-names>ME</given-names> </name><etal/></person-group><article-title>A systematic review of patient-reported outcomes in primary biliary cholangitis and primary sclerosing cholangitis</article-title><source>Hepatol Commun</source><year>2020</year><volume>4</volume><issue>10</issue><fpage>1502</fpage><lpage>1515</lpage><pub-id pub-id-type="doi">10.1002/hep4.1567</pub-id><pub-id pub-id-type="medline">33024919</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gelhorn</surname><given-names>H</given-names> </name><name name-style="western"><surname>Currie</surname><given-names>BM</given-names> </name><name name-style="western"><surname>Bushnell</surname><given-names>DM</given-names> </name><etal/></person-group><article-title>Psychometric validation of the Worst Itch Numerical Rating Scale (WI-NRS) and other patient-reported outcome measures for assessing severity and impact of pruritus in patients with primary biliary cholangitis</article-title><source>Orphanet J Rare Dis</source><year>2025</year><month>07</month><day>31</day><volume>20</volume><issue>1</issue><fpage>390</fpage><pub-id pub-id-type="doi">10.1186/s13023-025-03798-x</pub-id><pub-id pub-id-type="medline">40745549</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gerussi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Verda</surname><given-names>D</given-names> </name><name name-style="western"><surname>Bernasconi</surname><given-names>DP</given-names> </name><etal/></person-group><article-title>Machine learning in primary biliary cholangitis: a novel approach for risk stratification</article-title><source>Liver Int</source><year>2022</year><month>03</month><volume>42</volume><issue>3</issue><fpage>615</fpage><lpage>627</lpage><pub-id pub-id-type="doi">10.1111/liv.15141</pub-id><pub-id pub-id-type="medline">34951722</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Njei</surname><given-names>B</given-names> </name><name name-style="western"><surname>Osta</surname><given-names>E</given-names> </name><name name-style="western"><surname>Njei</surname><given-names>N</given-names> </name><name name-style="western"><surname>Al-Ajlouni</surname><given-names>YA</given-names> </name><name name-style="western"><surname>Lim</surname><given-names>JK</given-names> </name></person-group><article-title>An explainable machine learning model for prediction of high-risk nonalcoholic steatohepatitis</article-title><source>Sci Rep</source><year>2024</year><month>04</month><day>13</day><volume>14</volume><issue>1</issue><fpage>8589</fpage><pub-id pub-id-type="doi">10.1038/s41598-024-59183-4</pub-id><pub-id pub-id-type="medline">38615137</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Njei</surname><given-names>B</given-names> </name><name name-style="western"><surname>Osta</surname><given-names>E</given-names> </name><name name-style="western"><surname>Ilagan-Ying</surname><given-names>YC</given-names> </name><etal/></person-group><article-title>534: FibroX: an explainable AI model for accurate prediction of advanced liver fibrosis and cardiovascular mortality in MASLD</article-title><source>Gastroenterology</source><year>2025</year><month>05</month><volume>169</volume><issue>1</issue><fpage>S131</fpage><pub-id pub-id-type="doi">10.1016/S0016-5085(25)01246-6</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Montano-Loza</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Corpechot</surname><given-names>C</given-names> </name></person-group><article-title>Definition and management of patients with primary biliary cholangitis and an incomplete response to therapy</article-title><source>Clin Gastroenterol Hepatol</source><year>2021</year><month>11</month><volume>19</volume><issue>11</issue><fpage>2241</fpage><lpage>2251.e1</lpage><pub-id pub-id-type="doi">10.1016/j.cgh.2020.06.062</pub-id><pub-id pub-id-type="medline">32629125</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Tsoris</surname><given-names>A</given-names> </name><name name-style="western"><surname>Marlar</surname><given-names>CA</given-names> </name></person-group><article-title>Use of the Child Pugh score in liver disease</article-title><source>StatPearls</source><year>2019</year><publisher-name>StatPearls Publishing</publisher-name></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Higgins-Biddle</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Babor</surname><given-names>TF</given-names> </name></person-group><article-title>A review of the Alcohol Use Disorders Identification Test (AUDIT), AUDIT-C, and USAUDIT for screening in the United States: past issues and future directions</article-title><source>Am J Drug Alcohol Abuse</source><year>2018</year><volume>44</volume><issue>6</issue><fpage>578</fpage><lpage>586</lpage><pub-id pub-id-type="doi">10.1080/00952990.2018.1456545</pub-id><pub-id pub-id-type="medline">29723083</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chazouill&#x00E8;res</surname><given-names>O</given-names> </name><name name-style="western"><surname>Wendum</surname><given-names>D</given-names> </name><name name-style="western"><surname>Serfaty</surname><given-names>L</given-names> </name><name name-style="western"><surname>Montembault</surname><given-names>S</given-names> </name><name name-style="western"><surname>Rosmorduc</surname><given-names>O</given-names> </name><name name-style="western"><surname>Poupon</surname><given-names>R</given-names> </name></person-group><article-title>Primary biliary cirrhosis-autoimmune hepatitis overlap syndrome: clinical features and response to therapy</article-title><source>Hepatology</source><year>1998</year><month>08</month><volume>28</volume><issue>2</issue><fpage>296</fpage><lpage>301</lpage><pub-id pub-id-type="doi">10.1002/hep.510280203</pub-id><pub-id pub-id-type="medline">9695990</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jiang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>BH</given-names> </name><name name-style="western"><surname>Rodgers</surname><given-names>B</given-names> </name><name name-style="western"><surname>Pyrsopoulos</surname><given-names>N</given-names> </name></person-group><article-title>Characteristics and inpatient outcomes of primary biliary cholangitis and autoimmune hepatitis overlap syndrome</article-title><source>J Clin Transl Hepatol</source><year>2021</year><month>06</month><day>28</day><volume>9</volume><issue>3</issue><fpage>392</fpage><lpage>398</lpage><pub-id pub-id-type="doi">10.14218/JCTH.2021.00008</pub-id><pub-id pub-id-type="medline">34221925</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hern&#x00E1;ndez-P&#x00E9;rez</surname><given-names>M</given-names> </name><name name-style="western"><surname>Riado</surname><given-names>D</given-names> </name><name name-style="western"><surname>Pena</surname><given-names>E</given-names> </name><etal/></person-group><article-title>The overlap with metabolic dysfunction-associated steatotic liver disease negatively affects outcomes of primary biliary cholangitis</article-title><source>Aliment Pharmacol Ther</source><year>2024</year><month>09</month><volume>60</volume><issue>5</issue><fpage>613</fpage><lpage>619</lpage><pub-id pub-id-type="doi">10.1111/apt.18134</pub-id><pub-id pub-id-type="medline">38924185</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zachariah</surname><given-names>M</given-names> </name><name name-style="western"><surname>Cook</surname><given-names>J</given-names> </name><name name-style="western"><surname>Burrows</surname><given-names>M</given-names> </name><name name-style="western"><surname>Eljack</surname><given-names>A</given-names> </name><name name-style="western"><surname>Patanwala</surname><given-names>I</given-names> </name></person-group><article-title>P211&#x2005;Prevalence of metabolic dysfunction-associated steatotic liver disease and its impact on primary biliary cholangitis</article-title><source>Gut</source><year>2025</year><access-date>2026-06-02</access-date><volume>74</volume><fpage>A213</fpage><lpage>A214</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://gut.bmj.com/content/74/Suppl_1/A213.2.info">https://gut.bmj.com/content/74/Suppl_1/A213.2.info</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Carbone</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sharp</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Flack</surname><given-names>S</given-names> </name><etal/></person-group><article-title>The UK-PBC risk scores: derivation and validation of a scoring system for long-term prediction of end-stage liver disease in primary biliary cholangitis</article-title><source>Hepatology</source><year>2016</year><month>03</month><volume>63</volume><issue>3</issue><fpage>930</fpage><lpage>950</lpage><pub-id pub-id-type="doi">10.1002/hep.28017</pub-id><pub-id pub-id-type="medline">26223498</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marenco-Flores</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rojas Amaris</surname><given-names>N</given-names> </name><name name-style="western"><surname>Kahan</surname><given-names>T</given-names> </name><etal/></person-group><article-title>The external validation of GLOBE and UK-PBC risk scores for predicting ursodeoxycholic acid treatment response in a large U.S. cohort of primary biliary cholangitis patients</article-title><source>J Clin Med</source><year>2024</year><month>08</month><day>1</day><volume>13</volume><issue>15</issue><fpage>4497</fpage><pub-id pub-id-type="doi">10.3390/jcm13154497</pub-id><pub-id pub-id-type="medline">39124763</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>de Franchis</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bosch</surname><given-names>J</given-names> </name><name name-style="western"><surname>Garcia-Tsao</surname><given-names>G</given-names> </name><name name-style="western"><surname>Reiberger</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ripoll</surname><given-names>C</given-names> </name><collab>Baveno VII Faculty</collab></person-group><article-title>Baveno VII - renewing consensus in portal hypertension</article-title><source>J Hepatol</source><year>2022</year><month>04</month><volume>76</volume><issue>4</issue><fpage>959</fpage><lpage>974</lpage><pub-id pub-id-type="doi">10.1016/j.jhep.2021.12.022</pub-id><pub-id pub-id-type="medline">35120736</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Lai</surname><given-names>H</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Clinically significant portal hypertension in patients with primary biliary cholangitis: clinicopathological features and prognostic value</article-title><source>Ann Hepatol</source><year>2025</year><volume>30</volume><issue>1</issue><fpage>101577</fpage><pub-id pub-id-type="doi">10.1016/j.aohep.2024.101577</pub-id><pub-id pub-id-type="medline">39276989</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>YF</given-names> </name><name name-style="western"><surname>Li</surname><given-names>SX</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>HL</given-names> </name><etal/></person-group><article-title>Precirrhotic primary biliary cholangitis with portal hypertension: bile duct injury correlate</article-title><source>Gut Liver</source><year>2024</year><month>09</month><day>15</day><volume>18</volume><issue>5</issue><fpage>867</fpage><lpage>876</lpage><pub-id pub-id-type="doi">10.5009/gnl230468</pub-id><pub-id pub-id-type="medline">38623061</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Riley</surname><given-names>RD</given-names> </name><name name-style="western"><surname>Snell</surname><given-names>KI</given-names> </name><name name-style="western"><surname>Ensor</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Minimum sample size for developing a multivariable prediction model: PART II - binary and time-to-event outcomes</article-title><source>Stat Med</source><year>2019</year><month>03</month><day>30</day><volume>38</volume><issue>7</issue><fpage>1276</fpage><lpage>1296</lpage><pub-id pub-id-type="doi">10.1002/sim.7992</pub-id><pub-id pub-id-type="medline">30357870</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chan</surname><given-names>AW</given-names> </name><name name-style="western"><surname>Boutron</surname><given-names>I</given-names> </name><name name-style="western"><surname>Hopewell</surname><given-names>S</given-names> </name><etal/></person-group><article-title>SPIRIT 2025 statement: updated guideline for protocols of randomised trials</article-title><source>Lancet</source><year>2025</year><month>05</month><volume>405</volume><issue>10491</issue><fpage>e19</fpage><lpage>e27</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(25)00770-6</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="web"><person-group person-group-type="author"><collab>OpenAI</collab></person-group><article-title>ChatGPT</article-title><access-date>2026-06-12</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://chatgpt.com/">https://chatgpt.com/</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>System Usability Scale.</p><media xlink:href="resprot_v15i1e89279_app1.docx" xlink:title="DOCX File, 15 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>AI -Trust Scale (adapted for the AIm-PBC).</p><media xlink:href="resprot_v15i1e89279_app2.docx" xlink:title="DOCX File, 15 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>NASA Task Load Index.</p><media xlink:href="resprot_v15i1e89279_app3.docx" xlink:title="DOCX File, 15 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Qualitative debriefing interview guide.</p><media xlink:href="resprot_v15i1e89279_app4.docx" xlink:title="DOCX File, 16 KB"/></supplementary-material><supplementary-material id="app5"><label>Checklist 1</label><p>SPIRIT (Standard Protocol Items: Recommendations for Interventional Trials) 2025 participant timeline for the AIm-PBC pilot provider-level crossover randomized controlled trial.</p><media xlink:href="resprot_v15i1e89279_app5.docx" xlink:title="DOCX File, 18 KB"/></supplementary-material></app-group></back></article>