<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Res Protoc</journal-id><journal-id journal-id-type="publisher-id">ResProt</journal-id><journal-id journal-id-type="index">5</journal-id><journal-title>JMIR Research Protocols</journal-title><abbrev-journal-title>JMIR Res Protoc</abbrev-journal-title><issn pub-type="epub">1929-0748</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v15i1e95236</article-id><article-id pub-id-type="doi">10.2196/95236</article-id><article-categories><subj-group subj-group-type="heading"><subject>Protocol</subject></subj-group></article-categories><title-group><article-title>Machine Learning&#x2013;Based Predictive Model for Functional Independence in Spinal Cord Injury: Protocol for a Predictive Rule Development and Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Perez-Sanpablo</surname><given-names>Alberto Isaac</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Rodriguez-Barragan</surname><given-names>Marlene Alejandra</given-names></name><degrees>MD, MSc</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Meneses-Pe&#x00F1;aloza</surname><given-names>Alicia</given-names></name><degrees>MD, MSc</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Quinza&#x00F1;os-Fresnedo</surname><given-names>Jimena</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Barrera-Ortiz</surname><given-names>Aida</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Palomino-Ramos</surname><given-names>Fabiola Monserrat</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Prado-Escobar</surname><given-names>Oscar</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Rodr&#x00ED;guez</surname><given-names>Marcela D</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lopez-Nava</surname><given-names>Irvin Hussein</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ambrosio-Bastian</surname><given-names>Jose</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib></contrib-group><aff id="aff1"><institution>Motion Analysis and Rehabilitation Engineering Lab, Instituto Nacional de Rehabilitaci&#x00F3;n</institution><addr-line>Mexico City</addr-line><country>Mexico</country></aff><aff id="aff2"><institution>Neurologic Rehabilitation Division, Instituto Nacional de Rehabilitaci&#x00F3;n</institution><addr-line>Mexico-Xochimilco Av. 289</addr-line><addr-line>Mexico City</addr-line><country>Mexico</country></aff><aff id="aff3"><institution>Pediatric Rehabilitation Division, Instituto Nacional de Rehabilitaci&#x00F3;n</institution><addr-line>Mexico City</addr-line><country>Mexico</country></aff><aff id="aff4"><institution>Faculty of Engineering, Universidad Aut&#x00F3;noma de Baja California</institution><addr-line>Mexicali</addr-line><addr-line>Baja California</addr-line><country>Mexico</country></aff><aff id="aff5"><institution>Data Science and Machine Learning Lab, Centro de Investigaci&#x00F3;n Cient&#x00ED;fica y de Educaci&#x00F3;n Superior de Ensenada (CICESE)</institution><addr-line>Ensenada</addr-line><addr-line>Baja California</addr-line><country>Mexico</country></aff><aff id="aff6"><institution>Universidad Tecnol&#x00F3;gica de M&#x00E9;xico (UNITEC)</institution><addr-line>Mexico City</addr-line><country>Mexico</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Sarvestan</surname><given-names>Javad</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Jimena Quinza&#x00F1;os-Fresnedo, MD, PhD, Neurologic Rehabilitation Division, Instituto Nacional de Rehabilitaci&#x00F3;n, Mexico-Xochimilco Av. 289, Mexico City, 14389, Mexico, 52 5559991000 ext 13410; <email>jimenaquinzanos@gmail.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>3</day><month>7</month><year>2026</year></pub-date><volume>15</volume><elocation-id>e95236</elocation-id><history><date date-type="received"><day>22</day><month>03</month><year>2026</year></date><date date-type="rev-recd"><day>05</day><month>05</month><year>2026</year></date><date date-type="accepted"><day>08</day><month>05</month><year>2026</year></date></history><copyright-statement>&#x00A9; Alberto Isaac Perez-Sanpablo, Marlene Alejandra Rodriguez-Barragan, Alicia Meneses-Pe&#x00F1;aloza, Jimena Quinza&#x00F1;os-Fresnedo, Aida Barrera-Ortiz, Fabiola Monserrat Palomino-Ramos, Oscar Prado-Escobar, Marcela D Rodr&#x00ED;guez, Irvin Hussein Lopez-Nava, Jose Ambrosio-Bastian. Originally published in JMIR Research Protocols (<ext-link ext-link-type="uri" xlink:href="https://www.researchprotocols.org">https://www.researchprotocols.org</ext-link>), 3.7.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.researchprotocols.org">https://www.researchprotocols.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.researchprotocols.org/2026/1/e95236"/><abstract><sec><title>Background</title><p>Spinal cord injury (SCI) causes substantial disability by disrupting spinal pathways, making functional independence a central rehabilitation goal. In 2024, approximately 15.4 million people worldwide were living with SCI. Despite its clinical relevance, traditional prognostic tools, notably the International Standards for Neurological Classification of Spinal Cord Injury (ISNCSCI), have limitations. Furthermore, access to advanced diagnostics constrains prediction. Existing models often fail to estimate independence, limiting goal setting and resource planning.</p></sec><sec><title>Objective</title><p>This study aims to develop and validate machine learning (ML)&#x2013;based rules that predict functional independence, as measured by the Spinal Cord Independence Measure, version III (SCIM-III), at 3, 6, and 12 months post injury in individuals with SCI. The model combines clinical admission predictors, readily available to enhance predictive performance: age, sex, time since injury, upper and lower extremity strength, ISNCSCI data (American Spinal Injury Association Impairment Scale grade and neurologic level of injury), rehabilitation type, and the Trunk Control Scale score validated by the research team.</p></sec><sec sec-type="methods"><title>Methods</title><p>Using retrospective electronic clinical records (2015&#x2010;2026) from Mexico&#x2019;s Nacional de Rehabilitaci&#x00F3;n Luis Guillermo Ibarra Ibarra (INR LGII; a tertiary national rehabilitation reference center) for model development and a prospective independent cohort (October 2026-October 2027) for external validation, the study will develop ML models to accurately and generally predict SCIM-III outcomes. Eligible participants are adults (&#x2265;18 years of age) with subacute or chronic SCI. Six architectures are compared: linear regression, classification and regression tree, categorical boosting (gradient boosting algorithm), light gradient boosting machine, multilayer perceptron, and Gaussian process regression, using 10-fold stratified cross-validation for internal validation. Performance is assessed by root-mean-square error, mean absolute error, <italic>R</italic>&#x00B2;, area under the curve, calibration plots, and decision curve analysis. The approach prioritizes reproducibility, interpretability, and clinical applicability, addressing prior models&#x2019; limitations (small sample sizes, limited validation, and impractical input requirements). Key steps include data preprocessing, feature selection, model training with appropriate algorithms, and robust evaluation against existing prognostic benchmarks. External validation and ethical considerations are integrated, with commitments to data sharing where feasible.</p></sec><sec sec-type="results"><title>Results</title><p>The study was approved and funded in October 2025. The retrospective development cohort targets 500 registries (from 2025&#x2010;2026) collected between October 2025 and June 2026. A total of 119 records were processed by March 2026. ML development is planned between June 2026 and March 2027. The external prospective validation cohort (n=100) is planned for October 2026-October 2027, and validation for June 2027-March 2028. Results are expected by January 2028.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>A reliable, clinically actionable ML-based prediction tool that estimates SCIM-III trajectories to support goal setting, rehabilitation planning, and resource allocation in SCI care will be developed. Model performance will be benchmarked against published SCI prediction rules, and it will be considered clinically useful if it outperforms the mean-score baseline and existing rules on the prospective validation cohort.</p></sec><sec><title>Trial Registration</title><p>Open Science Framework osf.io/4fmy6; https://osf.io/4fmy6/overview</p></sec><sec sec-type="registered-report"><title>International Registered Report Identifier (IRRID)</title><p>DERR1-10.2196/95236</p></sec></abstract><kwd-group><kwd>spinal cord injury</kwd><kwd>prognosis</kwd><kwd>machine learning</kwd><kwd>functional independence</kwd><kwd>SCIM-III</kwd><kwd>predictive modeling</kwd><kwd>rehabilitation</kwd><kwd>artificial intelligence</kwd><kwd>trunk control</kwd></kwd-group><custom-meta-wrap><custom-meta><meta-name>ext-peer-rev</meta-name><meta-value>The proposal for this study was externally peer-reviewed by the Secretar&#x00ED;a de Ciencia, Humanidades, Tecnolog&#x00ED;a e Innovaci&#x00F3;n (SECIHTI, Mexico). See the Peer Review Report for details</meta-value></custom-meta></custom-meta-wrap></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Overview</title><p>Spinal cord injury (SCI) is an important cause of disability due to the impairment of the ascending and descending pathways of the spinal cord. This is why effective SCI rehabilitation includes patient-centered goal setting by the patient, their family, and the multidisciplinary team attending to them. Goal setting helps identify a person&#x2019;s needs, values, and expectations and is ultimately regarded as a central principle in rehabilitation. Nevertheless, there is some controversy about how to establish goal setting [<xref ref-type="bibr" rid="ref1">1</xref>]. Prognostic tools can objectively help establish those goals, as previously demonstrated [<xref ref-type="bibr" rid="ref2">2</xref>].</p><p>In 2026, the principal clinical tool for predicting recovery and function is the International Standards for Neurological Classification of Spinal Cord Injury (ISNCSCI). Nevertheless, those standards have some limitations in their prediction properties [<xref ref-type="bibr" rid="ref3">3</xref>]. In particular, a ceiling effect for mild injuries (American Spinal Injury Association Impairment Scale [AIS] D), and the potential for misclassification at the time of the initial examination or follow-up have been described. Other studied prediction works use magnetic resonance imaging (MRI), cerebrospinal fluid biomarkers, and neurophysiological measures, which are difficult to access for many care centers and are typically performed in the first hours following the injury, a situation that does not usually occur in many places [<xref ref-type="bibr" rid="ref4">4</xref>].</p><p>Clinical prediction rules, a subset of clinical indicators to predict outcomes or assist in clinical decisions, have been developed as prognostic tools [<xref ref-type="bibr" rid="ref5">5</xref>]. The majority of them focus on independent walking prediction, and use regression models that are not the best prediction model [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. A recent study focuses on independence and uses a classification regression tree. Still, the main outcome is the Functional Independence Measure score, which is not specific to people with SCI, and whose study population was limited to individuals with cervical SCI, which undermines its applicability [<xref ref-type="bibr" rid="ref8">8</xref>].</p><p>Machine learning (ML) helps find a predictive model that better fits reality [<xref ref-type="bibr" rid="ref9">9</xref>]. Also, using specific, validated tools is necessary to make a prognosis after an SCI. So, the main objective of our work is to develop and validate ML-based rules predicting Spinal Cord Independence Measure, version III (SCIM-III) at 3, 6, and 12 months in individuals with SCI.</p></sec><sec id="s1-2"><title>Background</title><p>Neurological diseases are the leading cause of disability worldwide, and in Mexico, SCI is among the most frequent conditions requiring rehabilitation care. SCI is one of the most complex pathologies in rehabilitation medicine due to its direct impact on functionality, independence, and quality of life of affected individuals [<xref ref-type="bibr" rid="ref10">10</xref>]. People with this diagnosis, many of whom are working age, would benefit from precise prognoses to guide rehabilitation goals, optimize resources, and improve patient-caregiver communication. However, health inequalities may affect SCI rehabilitation outcomes in Mexico: lower-income and rural populations may face delayed access to specialized centers such as Instituto Nacional de Rehabilitaci&#x00F3;n Luis Guillermo Ibarra Ibarra (INR LGII). These disparities may influence functional trajectories and are considered in the interpretation of model generalizability.</p><p>Although these variables have been used as inputs in functional prediction models under development in 2026, clinical decision-making still depends largely on individual clinical judgment, which may lead to uncertainty in goal setting, institutional burden, or uncertainty for patients and caregivers [<xref ref-type="bibr" rid="ref11">11</xref>]. Some clinical rules allow partial anticipation of functional recovery, in particular concerning walking ability, but few have demonstrated a significant effect in clinical practice [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. Several studies have identified that variables such as injury severity classification (AIS), neurological level of injury, Upper Extremity Motor Score (UEMS), Lower Extremity Motor Score (LEMS), and Trunk Control Scale (ECT) have prognostic value [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. However, there are few tools capable of predicting overall functional independence, as comprehensively measured by the SCIM-III [<xref ref-type="bibr" rid="ref14">14</xref>].</p><p>In the multidisciplinary management of individuals following SCI, it is essential to have tangible, measurable, and objective tools to estimate functional prognosis in the short, medium, and long term. Several approaches currently allow preliminary predictions based primarily on the severity and neurological level of injury, using the American Spinal Injury Association classification or the AIS. However, despite their clinical usefulness, these measures alone may not fully capture the complexity of functional recovery, highlighting the need for objective and reproducible prognostic tools that can support clinical decision-making and rehabilitation planning.</p><p>MRI plays a fundamental role in the evaluation of SCI, as it allows detailed assessment of spinal cord involvement and surrounding soft tissues, enabling the identification of the severity of neurological damage and the potential for recovery. In this context, MRI-based scoring systems, such as the Brain and Spinal Injury Center score, have demonstrated utility in predicting neurological outcomes in individuals with acute SCI.</p><p>Other predictive strategies include the timing of posttraumatic surgical intervention, as multiple studies and meta-analyses have demonstrated that early surgical decompression (within the first 24 hours) is associated with a higher probability of neurological improvement as measured by the AIS.</p><p>In addition, several structural and neuroinflammatory biomarkers related to SCI have been identified. These biomarkers are derived from disruption of the blood-spinal cord barrier and from inflammatory processes occurring after the injury. Among the most studied are neurofilaments, glial fibrillary acidic protein, phosphorylated neurofilament heavy chain, and other proteins detected in cerebrospinal fluid and blood, whose concentrations have been correlated with injury severity and the potential for neurological recovery. These findings suggest that biomarkers may contribute in the future to improving the prediction of functional outcomes in individuals with SCI.</p><p>Although neurological assessment using ISNCSCI and the AIS classification allows estimation of SCI severity and provides guidance regarding neurological prognosis, their ability to predict overall functional independence remains limited. Tools such as the SCIM-III were developed specifically for SCI to provide a more comprehensive evaluation of functional performance in activities of daily living. However, although these instruments allow the assessment of functional status in individuals with SCI, their capacity to accurately predict future functional independence remains limited, which has motivated the development of more advanced predictive models capable of integrating multiple clinical and functional variables into objective prognostic frameworks [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>].</p><p>ML has been applied in the field of medicine for various purposes, including disease diagnosis, drug development, and the analysis of medical data. This approach offers several advantages in the prediction and development of prognostic models for certain diseases compared with traditional statistical methods, such as linear or logistic regression. Specifically, it imposes fewer restrictions on the number of predictors derived from a given dataset and is well-suited for identifying complex nonlinear relationships within data.</p><p>In the context of SCI, ML has already been applied in studies focusing on quality of life, duration of opioid prescription, length of stay in intensive care units, and, more recently, in the prediction of walking outcomes [<xref ref-type="bibr" rid="ref17">17</xref>].</p><p>This new wave of research studies the highly complex problem of predicting personalized rehabilitation trajectories, using multimodal, longitudinal, and often incomplete datasets. Such an approach has high potential clinical and social impact and represents a transition toward computational evidence-based individualized medicine.</p><p>Despite the growing data supporting these approaches, no studies conducted in Mexico or Latin America have validated a predictive rule for the SCIM-III score or integrated the ECT developed by members of our research group [<xref ref-type="bibr" rid="ref13">13</xref>]. At the INR LGII, trunk control assessment is a key component of treatment planning. Trunk control has been identified as an accurate predictor of functional independence, demonstrating high sensitivity and specificity [<xref ref-type="bibr" rid="ref13">13</xref>].</p><p>The clinical ECT developed at our institution has led to subsequent research conducted at our center, which demonstrated its prognostic validity for predicting functional independence and walking ability in individuals with SCI, highlighting trunk stability as a relevant clinical indicator of functional outcomes. These findings support the integration of trunk control assessment into prognostic models of rehabilitation outcomes.</p><p>In addition, recent technological advances have expanded the possibilities for a more objective evaluation of trunk function. The validation of inertial measurement units for the assessment of trunk control in individuals with SCI has shown that wearable sensors can provide reliable and quantitative measurements of postural control during functional tasks.</p><p>Together, these advances reinforce the potential for integrating traditional clinical assessments with technological tools to improve prognostic accuracy. Based on these institutional achievements, our center is well-positioned to contribute to the development of clinical prediction rules for functional independence in SCI, integrating traditional neurological variables with trunk control assessment and emerging quantitative tools [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>].</p></sec><sec id="s1-3"><title>Hypothesis and Research Question</title><p>Previous research has identified several early clinical variables associated with neurological and functional recovery following SCI. Factors such as age, motor strength in key myotomes, sensory preservation in specific dermatomes, and the presence of sacral sparing (S4-S5) have consistently been reported as relevant indicators of neurological recovery and long-term functional outcomes. In particular, certain myotomes and dermatomes have special clinical relevance for predicting walking ability. Among the most important myotomes are L3 (quadriceps femoris, responsible for knee extension) and S1 (gastrocnemius-soleus complex, responsible for plantar flexion), as muscle strength in these groups is closely associated with the ability to support body weight and generate the propulsion required for ambulation. From a sensory perspective, the L3 and S1 dermatomes, assessed through light touch and pinprick sensation, have also demonstrated prognostic value in several clinical models of walking recovery. Likewise, the preservation of sensation in the sacral segments S4-S5, known as sacral sparing, represents one of the most important predictors of neurological improvement, as it reflects the integrity of residual neural pathways below the level of injury [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref19">19</xref>].</p><p>However, our research group has demonstrated that global independence is more relevant than walking ability in determining quality of life [<xref ref-type="bibr" rid="ref13">13</xref>]. The ECT developed at the INR LGII has shown high correlations with functional outcomes and may improve predictive performance, since the ISNCSCI does not evaluate trunk musculature [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. Therefore, combining this scale with artificial intelligence techniques could lead to the development of a new, more accurate, and clinically useful prediction rule.</p><p>This leads to the following hypothesis: it is possible to develop a reliable and clinically relevant functional prediction rule to estimate the SCIM-III score in individuals with SCI using clinical variables such as age, time since injury, upper and lower extremity strength (UEMS and LEMS), and trunk control through the use of multivariate statistical models and ML algorithms. This hypothesis gives rise to the following research question: Is it feasible to develop a consistent and valid functional prediction rule to estimate the SCIM-III score in individuals with SCI based on selected clinical variables and using ML models?</p></sec><sec id="s1-4"><title>Justification</title><p>At the INR LGII, approximately 2500 participants from across the country are treated annually, primarily individuals of working age who may benefit from a more accurate prognosis to plan rehabilitation goals, optimize resources, and improve communication of expectations [<xref ref-type="bibr" rid="ref20">20</xref>]. Combining artificial intelligence with validated clinical variables in a predictive model will not only fill an important knowledge gap in Mexico but will also help advance neurological rehabilitation, strengthen health equity, and promote the training of specialized human resources. This project could benefit this population, as well as 30 specialist physicians and trainees, institutions, and professionals across the country involved in SCI rehabilitation, and more than 20,000 professionals in Mexico working in neurological rehabilitation.</p><p>The proposal is consistent with the objectives of the Basic and Frontier Science 2025 call by generating original frontier knowledge in a critical and rapidly growing health field, using ML to predict functional outcomes in SCI participants.</p></sec><sec id="s1-5"><title>Objectives</title><p>The main objective of this work is to develop and validate ML-based rules predicting independence, as measured by SCIM-III, at 3, 6, and 12 months post injury in individuals with SCI. Secondary objectives include:</p><list list-type="bullet"><list-item><p>To build a database of clinical variables in clinical records of individuals with SCI readily available in low-resource rehabilitation settings, such as age, time since injury, upper and lower extremity strength (UEMS/LEMS), trunk control, and ISNCSCI data</p></list-item><list-item><p>To identify the best predictors using statistics and ML models.</p></list-item><list-item><p>To select and validate the best-performing model, generating a practical clinical prediction rule for functional independence estimation.</p></list-item><list-item><p>To disseminate results through open-access publications, conference presentations, and scientific training activities for rehabilitation students.</p></list-item></list></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>This is an observational, analytical, mixed design (retrospective-prospective) study. The study consists of two components: (1) a retrospective review of existing electronic clinical records of individuals with SCI treated at INR LGII, and (2) a prospective follow-up with a 12-month SCIM-III assessment.</p></sec><sec id="s2-2"><title>Setting</title><p>The study will be conducted at the INR LGII, a tertiary care national reference center for rehabilitation medicine in Mexico City, Mexico. The INR LGII receives individuals from all regions of the country and is the largest SCI rehabilitation center in Mexico.</p></sec><sec id="s2-3"><title>Participants</title><p><xref ref-type="other" rid="box1">Textbox 1</xref> presents the inclusion and exclusion criteria of participants throughout the study phases.</p><boxed-text id="box1"><title> Inclusion and exclusion criteria for all study phases.</title><p><bold>Inclusion criteria for the retrospective phase</bold></p><list list-type="bullet"><list-item><p>Age &#x2265;18 years at time of spinal cord injury (SCI)</p></list-item><list-item><p>Confirmed diagnosis of subacute or chronic SCI (traumatic or nontraumatic)</p></list-item><list-item><p>Clinical follow-up at the Instituto Nacional de Rehabilitaci&#x00F3;n Luis Guillermo Ibarra IbarraI with evaluations at 3, 6, and/or 12 months post admission to rehabilitation</p></list-item><list-item><p>Complete clinical records with the following variables: Spinal Cord Independence Measure, version III, American Spinal Injury Association Impairment Scale grade, Upper Extremity Motor Score, Lower Extremity Motor Score, Trunk Control Scale, age, sex, type of rehabilitation, and time since injury</p></list-item></list><p><bold>Inclusion Criteria for the Prospective Phase</bold></p><list list-type="bullet"><list-item><p>Age &#x2265;18 years at time of SCI</p></list-item><list-item><p>Confirmed diagnosis of subacute or chronic SCI (traumatic or nontraumatic)</p></list-item><list-item><p>Signed informed consent</p></list-item></list><p><bold>Exclusion criteria for retrospective and prospective phases</bold></p><list list-type="bullet"><list-item><p>Confirmed diagnosis of severe comorbid neurological conditions independent of SCI (eg, stroke, traumatic brain injury, and neurodegenerative disease)</p></list-item><list-item><p>No motor deficit attributable to SCI</p></list-item><list-item><p>Age &#x003C;18 years</p></list-item></list></boxed-text></sec><sec id="s2-4"><title>Elimination Criteria for Both Phases</title><p>The following elimination criteria will apply to both retrospective and prospective phases:</p><list list-type="bullet"><list-item><p>Records with more than 30% missing data for the defined predictor variables.</p></list-item><list-item><p>Records with serious data entry inaccuracies or errors preventing reliable analysis.</p></list-item><list-item><p>Records duplicated.</p></list-item><list-item><p>Withdrawal of consent during the prospective data collection stage.</p></list-item></list></sec><sec id="s2-5"><title>Sample Size</title><p>Our target is a total of at least 500 patient records for internal development and validation, plus a separate external temporal validation cohort of 100 new patients (prospectively recruited from October 2026 to October 2027). Unlike hypothesis-testing sample size calculations, ML validation studies aim to estimate predictive performance accurately (low bias) and precisely (narrow CIs). Most studies on clinical ML-based prediction models do not justify the sample size [<xref ref-type="bibr" rid="ref21">21</xref>], since there is no universally accepted standard method for sample size in ML. To address this gap, we adopted a pragmatic, mixed methods approach to justify the sample size based on:</p><list list-type="bullet"><list-item><p>Model complexity and number of predictors<italic>:</italic> our nonlinear algorithms (gradient boosting and neural networks) require larger sample sizes than regression models [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. With up to 9 predictors, a sample of 500 patients provides a predictor-to-sample ratio of &#x003E;50:1. This ratio exceeds those generally proposed for ML studies, as well as those used in clinical prediction studies (eg, 20:1 or 37:1 from [<xref ref-type="bibr" rid="ref24">24</xref>]). Consequently, this ratio is sufficient to learn meaningful patterns without memorizing noise, thus reducing the risk of overfitting.</p></list-item><list-item><p>Validation needs: based on common practices in clinical ML studies, recent research has used 15%&#x2010;30% of the data for external validation [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. Accordingly, we defined 20% (100 patients) as the external test set. This proportion allows us to evaluate the final model performance on unseen data without compromising the training or hyperparameter validation phases.</p></list-item></list></sec><sec id="s2-6"><title>Variables</title><sec id="s2-6-1"><title>Outcome Variable</title><p>The primary outcome variable will be the SCIM-III score at 3, 6, and 12 months post admission. SCIM-III is a validated SCI-specific measure of functional independence, with higher scores reflecting greater independence [<xref ref-type="bibr" rid="ref16">16</xref>].</p></sec><sec id="s2-6-2"><title>Predictor Variables</title><p>Predictor variables, definitions, and measurement scales used for model development are shown in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Candidate predictor variables, clinical definitions, and encoding strategies for model development.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variable</td><td align="left" valign="bottom">Description</td><td align="left" valign="bottom">Scale/units</td></tr></thead><tbody><tr><td align="left" valign="top">Age</td><td align="left" valign="top">Age at SCI<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> onset</td><td align="left" valign="top">Years (continuous)</td></tr><tr><td align="left" valign="top">Sex</td><td align="left" valign="top">Biological sex</td><td align="left" valign="top">Male/female (binary)</td></tr><tr><td align="left" valign="top">Time since injury</td><td align="left" valign="top">Months from SCI to rehabilitation admission</td><td align="left" valign="top">Days (continuous); normalized (<italic>z</italic> score)</td></tr><tr><td align="left" valign="top">AIS<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> grade</td><td align="left" valign="top">American Spinal Injury Association Impairment Scale (neurological completeness)</td><td align="left" valign="top">A, B, C, D; one-hot encoded for model training</td></tr><tr><td align="left" valign="top">UEMS<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">Upper Extremity Motor Score (ISNCSCI<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup>)</td><td align="left" valign="top">0&#x2010;50 (continuous)</td></tr><tr><td align="left" valign="top">LEMS<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup></td><td align="left" valign="top">Lower Extremity Motor Score (ISNCSCI)</td><td align="left" valign="top">0&#x2010;50 (continuous)</td></tr><tr><td align="left" valign="top">ECT<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="top">Trunk Control Scale (developed at INR LGII)<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></td><td align="left" valign="top">0&#x2010;23 (ordinal, treated as continuous numeric)</td></tr><tr><td align="left" valign="top">Rehabilitation type</td><td align="left" valign="top">Type of rehabilitation program received</td><td align="left" valign="top">Categorical</td></tr><tr><td align="left" valign="top">Neurological level of injury</td><td align="left" valign="top">Cervical, thoracic, lumbar, or sacral level as determined by ISNCSCI examination at admission</td><td align="left" valign="top">Categorical (ordinal descending C1&#x2192;S5); encoded as ordinal integer</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>SCI: spinal cord injury. </p></fn><fn id="table1fn2"><p><sup>b</sup>AIS: American Spinal Injury Association Impairment Scale. </p></fn><fn id="table1fn3"><p><sup>c</sup>UEMS: Upper Extremity Motor Score. </p></fn><fn id="table1fn4"><p><sup>d</sup>ISNCSCI: International Standards for Neurological Classification of Spinal Cord Injury.</p></fn><fn id="table1fn5"><p><sup>e</sup>LEMS: Lower Extremity Motor Score.</p></fn><fn id="table1fn6"><p><sup>f</sup>ECT: Trunk Control Scale.</p></fn><fn id="table1fn7"><p><sup>g</sup>INR LGII: Instituto Nacional de Rehabilitaci&#x00F3;n Luis Guillermo Ibarra Ibarra.</p></fn></table-wrap-foot></table-wrap><p>Researchers include rehabilitation type as a predictor variable since it is part of the context of the patient preceding and affecting outcomes. Due to the observational nature of the study, researchers do not assume modifications in rehabilitation treatment between model application and outcome assessment. Researchers will conduct sensitivity analyses to evaluate potential effect modification on SCIM-III prediction by stratification by rehabilitation type.</p></sec></sec><sec id="s2-7"><title>Data Collection Procedure</title><p>During the first phase of the study, trained personnel started in October 2025, retrospective data collection from the INR LGII institutional electronic clinical records system covering the period from January 2015 to June 2026, following a standardized data extraction protocol. Retrospective data will be used to train ML models. Three board-certified rehabilitation physiatrists with &#x2265;2 years of experience in SCI rehabilitation are responsible for predictor assessments (AIS/ISNCSCI classification and ECT scoring) at INR LGII. Prior to data collection, evaluators will complete a standardized calibration session to ensure interrater consistency, documented in the data quality manual. All records will be anonymized at extraction, replacing personal identifiers with study codes. Investigators will define in the data quality manual procedure for data entry, missing data handling, range checks, and interrater consistency for clinically judged variables. As mentioned before, an external validation cohort of 100 new patient records will be prospectively recruited (October 2026-October 2027), consistent with recommendations for temporal validation in clinical ML studies [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. During this prospective component (2026&#x2010;2027), new participants admitted to INR LGII who meet the eligibility criteria will be prospectively enrolled in the external validation cohort. Participants will be initially evaluated to determine all clinical variables (AIS, UEMS, LEMS, and ECT) at 3, 6, and 12 months post admission.</p><p>In those individuals, clinical investigators will evaluate SCIM-III following the Catz et al [<xref ref-type="bibr" rid="ref16">16</xref>] protocol. Two board-certified rehabilitation physiatrists with experience in SCI rehabilitation will administer SCIM-III assessments. Evaluators will be blinded to predictor values at the time of SCIM-III evaluation. Admission variables (AIS, UEMS, LEMS, and ECT) will not be accessed during outcome measurement, preventing label leakage. Interrater reliability will be established through a standardized calibration session. Blinding procedures will be documented in the data quality manual. Clinical records used in the prospective component will not overlap with datasets used previously for the development of the models. No patient record from the prospective cohort will appear in the retrospective development dataset (2015&#x2010;2026), ensuring complete independence between development and validation data. Investigators will analyze any dataset differences to assess model generalizability.</p><p>Investigators will store data in password-protected institutional equipment, complying with Mexico&#x2019;s Ley General de Protecci&#x00F3;n de Datos Personales en Posesi&#x00F3;n de Sujetos Obligados and INR LGII ethical requirements.</p></sec><sec id="s2-8"><title>ML Model Development (Preprocessing)</title><p>Prior to model development, the dataset will undergo descriptive statistical analysis to examine the distributions, frequencies, and patterns of missing data. Exploratory correlation analyses will be conducted using Pearson and Spearman coefficients and correlation matrices to identify relevant predictors of SCIM-III and detect multicollinearity among variables.</p><p>Handling of missing data: a 2-step imputation strategy will be applied to address the missing data. Variables with less than 10% missing data will be addressed using median or mode imputation according to their distribution; those with 10%&#x2010;30% missingness will receive multivariate regression imputation with predictive mean matching. Records with more than 30% missing data in the defined predictor variables will be excluded according to the elimination criteria. Sensitivity analyses will compare the imputed datasets with complete case analyses to assess the stability of imputation decisions.</p><p>Feature preprocessing and encoding: categorical variables will be encoded as follows: AIS grades via one-hot encoding to avoid artificial ordinality, sex as a binary variable (0/1), and type of rehabilitation as a nominal variable with one-hot encoding. Continuous variables, including UEMS, LEMS, ECT, age, and time since injury, will undergo range validation, followed by <italic>z</italic> score normalization for the multilayer perceptron (MLP), minimum-maximum scaling for tree-based models, and Gaussian process regression (GPR). If the correlation analysis detects predictor redundancy, dimensionality reduction using principal component analysis (PCA) will be applied. All preprocessing decisions will be recorded in a version-controlled log to ensure complete reproducibility of the results. All preprocessing parameters (imputation values, normalization coefficients, and encoding mappings) will be derived from the training data and stored as part of the final model object for application to new observations without recalculation.</p><p>Variable selection: 3 complementary strategies will be combined: (1) filter methods using univariate statistics (Pearson/Spearman correlation and ANOVA <italic>F</italic> tests), (2) embedded methods based on model-derived importance (Gini impurity for trees, regularized coefficients for linear models), and (3) wrapper methods using recursive feature elimination with cross-validated performance as the selection criterion. The final inclusion of a predictor will require the convergence of at least 2 strategies and justification of clinical interpretability.</p><p>Researchers will apply all preprocessing steps uniformly across groups since no group-specific transformations are expected.</p></sec><sec id="s2-9"><title>Model Training</title><p>Six predictive model architectures will be trained and compared, ranging from interpretable statistical baselines to high-capacity nonlinear algorithms, with the goal of identifying the most suitable approach for predicting SCIM-III scores at 3, 6, and 12 months post admission. Given that SCIM-III is modeled as a continuous outcome in the primary analysis, model performance will be primarily evaluated using regression metrics, including root-mean-square error (RMSE), mean absolute error, and calibration measures (eg, prediction calibration and calibration plots), as well as prediction error quantified through prediction or CIs around the predicted scores.</p><p>Model architectures are as follows: (1) multivariate linear regression will serve as an interpretable statistical baseline; (2) decision trees (classification and regression tree [CART]) will generate transparent IF-THEN clinical rules with pruning and maximum depth constraints to limit overfitting; (3) categorical boosting (CatBoost; gradient boosting algorithm) natively handles categorical variables and class imbalances without the need for additional preprocessing; (4) light gradient boosting machine (LightGBM) will be tuned for the efficient handling of large data volumes and predictor importance ranking; (5) an MLP will be implemented with 2 hidden layers, Rectified Linear Unit or Leaky Rectified Linear Unit activation functions, Adam or Stochastic gradient descent optimization, and batch normalization; and (6) GPR will provide probabilistic predictions with 95% calibrated credible intervals to quantify predictive uncertainty.</p><p>Hyperparameter optimization: an initial random search will explore the hyperparameter space, and Bayesian optimization will perform fine-tuning. The architecture and regularization parameters of the MLP, depth and splitting criteria of CART, learning rates and regularization terms for CatBoost and LightGBM, and kernel selection for GPR will be adjusted based on performance in 10-fold stratified cross-validation.</p><p>Implementation and reproducibility: all models will be implemented in Python using scikit-learn, TensorFlow/Keras, or equivalent libraries with fixed random seeds. The dataset will be split according to a 60/20/20 (training/validation/test) scheme, with 10-fold stratified cross-validation applied during training. Investigators will allocate all records from the same individual (initial, 3, 6, and 12 months) to the same partition (training, validation, or test) and to the same fold during 10-fold cross-validation to prevent participant-level data leakage across subsets. Codes, model configurations, and preprocessing pipelines will be made available on Open Science Framework (OSF) and GitHub after publication in accordance with JMIR&#x2019;s open science requirements.</p></sec><sec id="s2-10"><title>Overfitting Prevention</title><p>To ensure generalizable models and mitigate overfitting&#x2014;where models learn noise rather than underlying relationships&#x2014;a multifaceted strategy will be implemented throughout development, structured around 6 approaches.</p><sec id="s2-10-1"><title>Data-Centric Regularization</title><p>The following data-centric strategies will be implemented to reduce overfitting and improve model generalizability:</p><list list-type="bullet"><list-item><p>Hold out: a rigorous data partitioning strategy will be used from the outset. The dataset will be divided into training (60%), validation (20%), and test (20%) sets. The validation set will be used exclusively for hyperparameter tuning and model selection, while the test set will be held back entirely until the final model evaluation to provide an unbiased estimate of its real-world performance.</p></list-item></list><list list-type="bullet"><list-item><p>Cross-validation: all model training and hyperparameter optimization will be guided by stratified 10-fold cross-validation on the training set. This technique partitions the training data into 10 complementary subsets, iteratively training on 9 and validating on 1. This maximizes the use of available data for training and provides a more robust and less noisy estimate of model performance than a single train/validation split, making the model selection process more resilient to overfitting.</p></list-item></list></sec><sec id="s2-10-2"><title>Algorithmic Regularization Techniques</title><p>Model-specific regularization will be a cornerstone of our approach to constrain model complexity:</p><list list-type="bullet"><list-item><p>For neural networks (MLP): we will use dropout (randomly ignoring a fraction of neurons during training), L1/L2 weight regularization (penalizing large weights), batch normalization (stabilizing layer inputs), and early stopping (halting training when performance on the validation set ceases to improve).</p></list-item><list-item><p>For decision trees (CART): tree growth will be constrained using prepruning (eg, limiting maximum depth or minimum samples per leaf) and post pruning (cost-complexity pruning) to prevent the tree from becoming overly specific to the training data.</p></list-item><list-item><p>For ensemble methods (CatBoost and LightGBM): we will use shrinkage (learning rate) to slow down the learning process and L1/L2 regularization terms directly within the boosting objective function to penalize model complexity.</p></list-item><list-item><p>For GPR: the flexibility of the model will be controlled by selecting appropriate kernels and incorporating a noise kernel to explicitly model and account for irreducible noise in the data, preventing the model from fitting to it.</p></list-item></list></sec><sec id="s2-10-3"><title>Feature Selection and Dimensionality Reduction</title><p>As detailed in the preprocessing section, rigorous feature selection using filter, wrapper, and embedded methods will eliminate redundant predictors, reducing the model&#x2019;s &#x201C;degrees of freedom&#x201D; and lowering overfitting risk. If predictor redundancy is high, PCA will be considered to compress the feature space while retaining the signal.</p><p>To ensure that no information from validation or test data contaminates model development, all preprocessing steps&#x2014;including missing data imputation, normalization/scaling, feature encoding, dimensionality reduction (PCA), and feature selection&#x2014;will be performed exclusively within the training partition. During k-fold cross-validation, these transformations will be fitted on each training fold and applied to the corresponding held-out fold without refitting, ensuring that no statistics computed from validation data influence the model. The same fitted preprocessing parameters from the final training set will be stored and applied unchanged to the external validation cohort. Hyperparameter tuning will likewise rely solely on cross-validated performance within the training data. This workflow ensures that performance estimates reflect true generalization rather than optimistic bias from information leakage.</p></sec><sec id="s2-10-4"><title>Simplicity via the Principle of Parsimony</title><p>Model selection will not be based solely on raw predictive performance (eg, <italic>R</italic><sup>2</sup>). We will explicitly consider model complexity using information criteria (for linear models) and by comparing the performance of simpler, more interpretable models (eg, multivariate linear regression and shallow decision trees) against more complex ones. A more complex model will only be selected if it provides a substantial and clinically meaningful improvement in performance on the validation set, thereby favoring simpler and inherently more generalizable solutions when their performance is comparable.</p></sec><sec id="s2-10-5"><title>Conservative Hyperparameter Optimization</title><p>The hyperparameter search space will be carefully defined to avoid extreme configurations known to cause overfitting (eg, excessively deep trees and very high learning rates). Optimization, guided by cross-validation performance, will explicitly minimize validation error, not training error. Bayesian optimization is particularly advantageous here, efficiently exploring the trade-off between complexity and performance.</p></sec><sec id="s2-10-6"><title>Final and Unbiased Performance Evaluation</title><p>Upon completion of all development and tuning using the retrospective cohort, the final optimal models will be evaluated on the prospective external validation cohort (n=100, recruited October 2026-October 2027). This temporal separation provides an unbiased estimate of true generalizability and expected clinical performance, the ultimate safeguard against inadvertent overfitting during iterative development. Researchers will examine model stability through bootstrap resampling (1000 iterations) to quantify the variability of individual predictions and performance estimates across bootstrap samples.</p><p>By integrating these 6 strategies, the project will systematically minimize overfitting risk, ensuring the developed ML-based rules are robust and clinically useful for predicting functional independence after SCI.</p></sec></sec><sec id="s2-11"><title>Model Evaluation</title><p>Model interpretability will be assessed using Shapley additive explanations (SHAP) values to quantify predictor contributions at both global and individual prediction levels. Investigators will analyze subgroup fairness by reporting model performance (RMSE, <italic>R</italic>&#x00B2;) stratified by sex, age group (18&#x2010;40, 41&#x2010;60, and &#x003E;60 years), AIS grade, and time since injury. Also, researchers will report subgroup sample sizes and CIs, and if the RMSE ratio exceeds 1.5 across groups, investigators will explore recalibration within underperforming subgroups. Full model performance measures are included in <xref ref-type="table" rid="table2">Table 2</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Performance metrics and clinical relevance for the evaluation of the predictive model.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Metric</td><td align="left" valign="bottom">Application</td><td align="left" valign="bottom">Clinical relevance</td></tr></thead><tbody><tr><td align="left" valign="top">RMSE<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="top">Regression accuracy</td><td align="left" valign="top">Prediction error in SCIM-III<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> points</td></tr><tr><td align="left" valign="top">MAE<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="top">Average absolute error</td><td align="left" valign="top">Interpretable error magnitude</td></tr><tr><td align="left" valign="top"><italic>R</italic>&#x00B2;</td><td align="left" valign="top">Variance explained</td><td align="left" valign="top">Model fit quality</td></tr><tr><td align="left" valign="top">AUROC<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup></td><td align="left" valign="top">Binary classification (functional threshold)</td><td align="left" valign="top">Discrimination between functional categories</td></tr><tr><td align="left" valign="top">Sensitivity/specificity</td><td align="left" valign="top">Threshold-based classification</td><td align="left" valign="top">Clinical decision support performance</td></tr><tr><td align="left" valign="top">Calibration plot+Hosmer-Lemeshow</td><td align="left" valign="top">Agreement between predicted and observed SCIM-III (continuous calibration); goodness-of-fit for threshold classifications</td><td align="left" valign="top">Model reliability for clinical decision-making</td></tr><tr><td align="left" valign="top">Decision curve analysis</td><td align="left" valign="top">Net benefit of using the model versus treat-all or treat-none strategies across a range of clinical decision thresholds</td><td align="left" valign="top">Clinical utility: justifies model adoption over simpler clinical rules.</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>RMSE: root-mean-square error.</p></fn><fn id="table2fn2"><p><sup>b</sup>SCIM-III: Spinal Cord Independence Measure, version III.</p></fn><fn id="table2fn3"><p><sup>c</sup>MAE: mean absolute error.</p></fn><fn id="table2fn4"><p><sup>d</sup>AUROC: area under the receiver operating characteristic curve.</p></fn></table-wrap-foot></table-wrap><p>Additional considerations for model evaluation are described below:</p><list list-type="bullet"><list-item><p>A trivial statistical baseline (predicting the mean SCIM-III score) will define the minimum acceptable performance for the continuous prediction task. Models must significantly outperform this baseline using regression-based performance metrics (eg, RMSE, mean absolute error, <italic>R</italic>&#x00B2;, and calibration) to demonstrate clinical usefulness.</p></list-item><list-item><p>Secondary classification analyses will binarize SCIM-III scores using clinically meaningful thresholds. A score of &#x2265;55 will represent functional independence sufficient for discharge planning, while &#x2265;75 will indicate high independence. For these secondary dichotomized outcomes, performance will be summarized using the area under the receiver operating characteristic curve, sensitivity, specificity, and decision-curve analysis, and area under the curve (AUC) values will be compared using the DeLong test with 95% CIs.</p></list-item><list-item><p>Both thresholds will be reported with clinical justification. The primary model output remains a continuous SCIM-III prediction, with classification analyses considered exploratory secondary outcomes.</p></list-item></list></sec><sec id="s2-12"><title>External Validation</title><p>The best-performing model will undergo external validation in a prospective independent cohort of 100 new patient records not used during training, recruited between October 2026 and October 2027. This temporal separation constitutes a more stringent test than random partitioning, as it captures potential shifts in patient characteristics or clinical practices over time [<xref ref-type="bibr" rid="ref27">27</xref>]. The prospective validation cohort (2026&#x2010;2027) and the retrospective development cohort (2015&#x2010;2026) will share identical eligibility criteria, predictor definitions, and SCIM-III outcome protocol. Investigators will assess potential differences in case-mix, rehabilitation practice patterns, or data completeness between periods through descriptive comparison prior to model evaluation. All preprocessing parameters derived from the training set&#x2014;including imputation values, normalization coefficients, and encoding mappings&#x2014;will be applied without recalculation to the validation cohort to prevent information leakage.</p><p>Validation will assess calibration (calibration plots, Hosmer-Lemeshow test, Bland-Altman limits of agreement, and Pearson correlation between predicted and observed SCIM-III scores) and discrimination (RMSE and AUC) using unseen data. CIs (95%) will be estimated via bootstrap resampling (2000 iterations). Performance degradation exceeding 0.05 in AUC between internal and external validation will trigger a prespecified covariate shift analysis.</p><p>Model performance will be benchmarked against published prediction rules using comparable predictors [<xref ref-type="bibr" rid="ref14">14</xref>]. Subgroup analyses will examine predictive accuracy across AIS grade, age groups, and time since injury to identify heterogeneity and support clinically tailored application of the prediction model.</p></sec><sec id="s2-13"><title>Model Output and AI-Specific Considerations</title><p>Models will output a continuous predicted SCIM-III score (0&#x2010;100) at 3, 6, and 12 months post admission, framing the primary task as regression. Classification labels will only appear in secondary analyses using clinically meaningful SCIM-III thresholds. GPR will additionally provide 95% credible intervals to quantify prediction uncertainty [<xref ref-type="bibr" rid="ref17">17</xref>]. To enhance clinical transparency, individual predictions will be accompanied by SHAP values identifying the contribution of each predictor to the estimated SCIM-III score [<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>The model is intended as a clinical decision support tool to inform rehabilitation goal-setting and discharge planning, not to replace clinical judgment. Rehabilitation clinicians will enter 8 admission variables (age, sex, time since injury, AIS grade, UEMS, LEMS, ECT, and rehabilitation type). The backend will automatically perform preprocessing, encoding, and prediction. If predictor values are unavailable at the time of prediction, the system will flag the affected variables and apply the imputation parameters derived from the training set. Results will present a clinically interpretable SCIM-III estimate accompanied by its uncertainty interval. The prototype will initially be tested by investigators; clinician usability testing is planned in later project stages.</p><p>Because the primary task is regression, class imbalance methods are not required. For secondary classification analyses using SCIM-III thresholds, imbalance will be evaluated; if ratios exceed 3:1, stratified sampling and precision-recall metrics will complement the area under the receiver operating characteristic curve evaluation.</p><p>Researchers planned the model to be used by trained rehabilitation clinicians capable of reliably performing ISNCSCI classification, SCIM-III, and ECT scoring. An onboarding guide embedded in the application interface will orient new users. Users without formal ISNCSCI, SCIM-III, and ECT training should complete structured training prior to clinical use.</p></sec><sec id="s2-14"><title>Ethical Considerations</title><p>The study was reviewed and approved by the Research Committee and Ethics in Research Committee of the INR LGII (protocol INRLGII 128/25, approved October 21, 2025).</p><p>Study follows Helsinki Declaration and Mexican regulations [<xref ref-type="bibr" rid="ref29">29</xref>]; retrospective anonymized records exempt consent. For prospective data collection, written informed consent will be obtained from all participants or their legal representatives. Participants will be clearly informed about the study objectives, procedures, potential risks, and the use of their clinical and rehabilitation data for developing and validating an ML-based predictive model. This study is classified as minimal risk, as it involves secondary analysis of existing clinical data without direct intervention. Nonetheless, potential psychological or social implications related to predictive outcomes will be carefully considered, particularly regarding how prognostic information may influence patient expectations. Predictive results will not be used as the sole basis for clinical decision-making. Personal identifiers will be removed, and datasets will be anonymized or deidentified prior to analysis. Data will be stored securely with restricted access, and safeguards will be implemented to prevent unauthorized use or re-identification. Data will be used exclusively for the purposes outlined in this protocol. Any secondary use will require additional ethical approval.</p><p>Formal patient and public involvement in study design was not incorporated, given the retrospective nature of the primary data source and the early development stage. Patient perspectives were informally considered during protocol design through consultation with INR LGII rehabilitation physiatrists who provided clinical input on SCIM-III threshold values and workflow integration. In the last year, a structured usability study with rehabilitation clinicians and patient advisory input will be conducted and reported separately. The authors acknowledge the significance of patient co-design in AI clinical tools and commit to incorporating patient and caregiver views before clinical deployment.</p><p>This study is preregistered on the OSF (DOI: 10.17605/OSF.IO/4FMY6) and on the Mexican national clinical registry [<xref ref-type="bibr" rid="ref30">30</xref>]. Both registrations are completed prior to prospective data collection.</p></sec><sec id="s2-15"><title>Timeline and Work Plan</title><p>Project timeline, methodological stages, and milestones for the development, validation, and implementation of the SCIM-III prediction model are shown in <xref ref-type="table" rid="table3">Table 3</xref>.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Timeline, work plan, and key milestones across project stages.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Stage</td><td align="left" valign="bottom">Dates</td><td align="left" valign="bottom">Activities</td><td align="left" valign="bottom">Milestone</td></tr></thead><tbody><tr><td align="left" valign="top">1</td><td align="left" valign="top">October 2025-June 2026</td><td align="left" valign="top">Data collection, anonymization, database structuring, descriptive and exploratory statistical analysis, and first technical report</td><td align="left" valign="top">Structured database</td></tr><tr><td align="left" valign="top">2</td><td align="left" valign="top">June 2026-March 2027</td><td align="left" valign="top">Development and training of ML<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> models (regression, DT<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup>, ANN<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup>, and GPR)<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup>, k-fold cross-validation, model comparison, and congress presentation</td><td align="left" valign="top">Trained models+publication</td></tr><tr><td align="left" valign="top">3</td><td align="left" valign="top">June 2027-March 2028</td><td align="left" valign="top">External validation, digital application development, patent/IP registration, international congress (ASIA<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup> 2027), and training workshop</td><td align="left" valign="top">Validated rule+app prototype</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>ML: machine learning.</p></fn><fn id="table3fn2"><p><sup>b</sup>DT: decision tree.</p></fn><fn id="table3fn3"><p><sup>c</sup>ANN: artificial neural network.</p></fn><fn id="table3fn4"><p><sup>d</sup>GPR: Gaussian process regression.</p></fn><fn id="table3fn5"><p><sup>e</sup>ASIA: American Spinal Injury Association.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-16"><title>Team</title><p>The multidisciplinary team comprises 10 researchers across 3 institutions (<xref ref-type="table" rid="table4">Table 4</xref>).</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Research team members, institutional affiliations, and project roles.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Name</td><td align="left" valign="bottom">Institution/specialty</td><td align="left" valign="bottom">Role</td></tr></thead><tbody><tr><td align="left" valign="top">Alberto Isaac P&#x00E9;rez-Sanpablo</td><td align="left" valign="top">INR LGII<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup>/biomedical engineering</td><td align="left" valign="top">Principal investigator</td></tr><tr><td align="left" valign="top">Jimena Quinza&#x00F1;os-Fresnedo</td><td align="left" valign="top">INR LGII/neurological rehabilitation</td><td align="left" valign="top">Coinvestigator</td></tr><tr><td align="left" valign="top">A&#x00ED;da Barrera-Ortiz</td><td align="left" valign="top">INR LGII/neurological rehabilitation</td><td align="left" valign="top">Coinvestigator</td></tr><tr><td align="left" valign="top">Marlene A Rodr&#x00ED;guez-Barrag&#x00E1;n</td><td align="left" valign="top">INR LGII/neurological rehabilitation</td><td align="left" valign="top">Coinvestigator</td></tr><tr><td align="left" valign="top">Fabiola Monserrat Palomino-Ramos</td><td align="left" valign="top">INR LGII/neurological rehabilitation</td><td align="left" valign="top">Coinvestigator</td></tr><tr><td align="left" valign="top">Alicia Meneses-Pe&#x00F1;aloza</td><td align="left" valign="top">INR LGII/pediatric rehabilitation</td><td align="left" valign="top">Coinvestigator</td></tr><tr><td align="left" valign="top">Oscar Prado-Escobar</td><td align="left" valign="top">INR LGII/rehabilitation medicine (resident)</td><td align="left" valign="top">Student Investigator</td></tr><tr><td align="left" valign="top">Marcela D Rodr&#x00ED;guez-Urrea</td><td align="left" valign="top">UABC<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup>/computer science</td><td align="left" valign="top">Coinvestigator (ML<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup>)</td></tr><tr><td align="left" valign="top">Irvin Hussein L&#x00F3;pez-Nava</td><td align="left" valign="top">CICESE<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup>/artificial intelligence</td><td align="left" valign="top">Coinvestigator (AI<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup>)</td></tr><tr><td align="left" valign="top">Jos&#x00E9; Ambrosio-Basti&#x00E1;n</td><td align="left" valign="top">Independent/artificial intelligence</td><td align="left" valign="top">Coinvestigator (AI)</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>INR LGII: Instituto Nacional de Rehabilitaci&#x00F3;n Luis Guillermo Ibarra Ibarra.</p></fn><fn id="table4fn2"><p><sup>b</sup>UABC: Universidad Aut&#x00F3;noma de Baja California.</p></fn><fn id="table4fn3"><p><sup>c</sup>ML: machine learning.</p></fn><fn id="table4fn4"><p><sup>d</sup>CICESE: Centro de Investigaci&#x00F3;n Cient&#x00ED;fica y de Educaci&#x00F3;n Superior de Ensenada.</p></fn><fn id="table4fn5"><p><sup>e</sup>AI: artificial intelligence.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>The study was funded by the Secretar&#x00ED;a de Ciencia, Humanidades, Tecnolog&#x00ED;a e Innovaci&#x00F3;n grant CBF-2025-I-3891 on October 29, 2025. The study was approved by the institutional research and ethics committees on October 21, 2025 (INRLGII 128/25). Researchers began retrospective data extraction from the institutional electronic clinical records system (records from January 2015 to June 2026) in October 2025. As of the submission of this manuscript in March 2026, researchers extracted and anonymized 119 retrospective patient records meeting eligibility criteria. Researchers are performing quality control and preprocessing of this data. Researchers plan to begin ML model development in June 2026 and expect to complete it by March 2027. Researchers plan to open enrollment of the external validation cohort (n=100) in October 2026 and close it in October 2027. External validation is planned between June 2027 and March 2028. Results of the development and validation study are expected to be submitted for publication in January 2028.</p></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings (Anticipated)</title><p>This protocol describes the development of the first ML-based predictive model for SCIM-III outcomes in a Mexican SCI cohort. We anticipate that including the ECT trunk control variable&#x2014;not captured by the standard ISNCSCI&#x2014;together with classic clinical variables (UEMS, LEMS, AIS, age, and time since injury) will meaningfully improve prediction accuracy over models based solely on neurological classification. Preliminary data from our group suggest that trunk control comprises a significant proportion of functional independence variance in this population [<xref ref-type="bibr" rid="ref9">9</xref>].</p><p>Comparative models, interpreted through SHAP analysis, will identify the optimal balance between predictive accuracy and clinical interpretability for trustworthy rehabilitation decision support.</p></sec><sec id="s4-2"><title>Comparison With Previous Work</title><p>Numerous studies have been conducted on predicting recovery in individuals with SCI [<xref ref-type="bibr" rid="ref31">31</xref>]. van Middendorp et al [<xref ref-type="bibr" rid="ref7">7</xref>] developed a clinical prediction rule based on age and clinical neurological parameters, such as motor and sensory assessments, to predict the long-term likelihood of independent walking, and Kaminski et al [<xref ref-type="bibr" rid="ref32">32</xref>] reported in 2017 that the 1-year functional outcome, as measured by the SCIM-III, can be estimated using a simple equation that considers four parameters from the initial physical examination. Similarly, predictive models based on ML have been developed to estimate the level of functionality in individuals from the acute stage, some using the Functional Independence Measure or the SCIM-III, concluding that it is possible to predict with good accuracy the gait and/or independence in activities of daily living [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. Zhong et al [<xref ref-type="bibr" rid="ref35">35</xref>] conducted a systematic review and meta-analysis to evaluate the performance and quality of ML models in predicting SCI prognosis. The research indicated that ML models are significantly superior to traditional statistical models. This cutting-edge approach provides insights into how early prediction can be achieved using clinical characteristics at the time of patient admission.</p></sec><sec id="s4-3"><title>Limitations</title><p>As this is a retrospective design, we may encounter unavoidable biases and lack control over confounding variables. The sample size is small for ML, and the study was conducted at a single center, resulting in a good model but not universally reliable. Although researchers planned a two-stage imputation strategy and sensitivity analyses, we cannot fully exclude the possibility of residual bias from missing data. Also, the relatively small development sample may limit stability for high-capacity architectures (MLP and GPR) despite the proposed overfitting prevention strategies, and performance may degrade in populations with different case-mix profiles.</p><p>Also, participation (International Classification of Functioning, Disability, and Health) was not measured in this study. As of March 2026, no ML model has been effectively used to predict the prognosis of individuals with SCI in clinical practice. Greater interpretability of a model allows clinicians to better understand its predictive value and make clinical decisions that benefit individuals. Another limitation of our study is that it does not include biomarkers or advanced neuroimaging; however, in low-income countries, most centers lack the technology to perform these procedures in the acute phase. It is hoped that future research will continue to address this complex problem of model interpretability.</p></sec><sec id="s4-4"><title>Conclusions</title><p>Early prediction of functional independence recovery after SCI allows for the development of a rehabilitation strategy in patient management from the acute stage. Using ML, we aim to develop a tool that will enable us to identify key clinical predictors and provide a decision support system, thus predicting the degree of independence regained upon admission to an acute rehabilitation center. The protocol develops the first functional prediction tool for SCIs based on ML in Mexico, allowing for personalized rehabilitation planning and preparation for clinical application, laying the foundation for future research in SCI rehabilitation.</p></sec></sec></body><back><ack><p>The authors acknowledge the valuable collaboration of physicians, engineers, and researchers from different Mexican institutions who made this work possible. The authors also thank the Instituto Nacional de Rehabilitaci&#x00F3;n Luis Guillermo Ibarra Ibarra for providing the resources and facilities necessary to carry out this research. Finally, the authors are grateful to colleagues whose comments and suggestions contributed to improving the quality of this manuscript. The authors declare the use of generative AI (GenAI) in the research and writing process. According to the GAIDeT taxonomy (2025), the following tasks were delegated to GenAI tools under full human supervision: proofreading and editing, summarizing text, translation, reformatting, quality assessment, and publication support. The GenAI tool used was ChatGPT-5.3 and Claude Sonnet 4.6. Responsibility for the final manuscript lies entirely with the authors. GenAI tools are not listed as authors and do not bear responsibility for the final outcomes.</p><p>Declaration submitted by: collective responsibility</p></ack><notes><sec><title>Funding</title><p>This study was funded by Secretar&#x00ED;a de Ciencia, Humanidades, Tecnolog&#x00ED;a e Innovaci&#x00F3;n grant CBF-2025-I-3891 on October 29, 2025; the funder had no role in the study design, data collection, analysis and interpretation of the data, manuscript preparation, or the decision to publish the results.</p></sec><sec><title>Data Availability</title><p>The data used in this study include anonymized clinical information. Due to the nature of this data, the original dataset is not publicly available; however, it may be requested from the corresponding author, subject to approval by the appropriate ethics committees and compliance with data protection regulations. Researchers will release a synthetic dataset with a data dictionary (variable definitions, coding, units, and missingness patterns) on Open Science Framework (OSF; CC-BY 4.0) and analysis code on GitHub (MIT license), implemented in Python 3.10+ with scikit-learn 1.4, LightGBM 4.3, CatBoost 1.2, TensorFlow 2.15, and GPyTorch 1.11 upon publication of the article. The authors have taken the necessary measures to ensure data anonymization and compliance with applicable ethical and legal standards.</p><p>This study is preregistered on the OSF (DOI: 10.17605/OSF.IO/4FMY6) and on the Mexican national clinical registry [<xref ref-type="bibr" rid="ref30">30</xref>]. Both registrations are completed prior to prospective data collection.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: AIP-S, JQ-F</p><p>Methodology: AIP-S, JQ-F, MAR-B, MDR, IHL-N, JA-B</p><p>Funding acquisition: AIP-S</p><p>Project administration: AIP-S</p><p>Data acquisition: AB-O, MAR-B, FMP-R, AM-P, OP-E (student investigator)</p><p>Clinical expertise: JQ-F, AB-O, FMP-R, AM-P</p><p>Software: MDR, IHL-N, JA-B</p><p>Writing (original draft): AIP-S</p><p>Critical review: JQ-F, AB-O, MAR-B, FMP-R, AM-P, MDR, IHL-N, JA-B.</p><p>All authors read and approved the final manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AIS </term><def><p>American Spinal Injury Association Impairment Scale</p></def></def-item><def-item><term id="abb2">AUC </term><def><p>area under the curve</p></def></def-item><def-item><term id="abb3">CART</term><def><p>classification and regression tree</p></def></def-item><def-item><term id="abb4">CatBoost </term><def><p>categorical boosting</p></def></def-item><def-item><term id="abb5">ECT </term><def><p>Trunk Control Scale (Escala de Control de Tronco)</p></def></def-item><def-item><term id="abb6">GPR</term><def><p>Gaussian process regression</p></def></def-item><def-item><term id="abb7">INR LGII </term><def><p>Instituto Nacional de Rehabilitaci&#x00F3;n Luis Guillermo Ibarra Ibarra</p></def></def-item><def-item><term id="abb8">ISNCSCI</term><def><p>International Standards for Neurological Classification of Spinal Cord Injury</p></def></def-item><def-item><term id="abb9">LEMS</term><def><p>Lower Extremity Motor Score</p></def></def-item><def-item><term id="abb10">LightGBM</term><def><p>light gradient boosting machine</p></def></def-item><def-item><term id="abb11">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb12">MLP </term><def><p>multilayer perceptron</p></def></def-item><def-item><term id="abb13">MRI</term><def><p>magnetic resonance imaging</p></def></def-item><def-item><term id="abb14">OSF </term><def><p>Open Science Framework</p></def></def-item><def-item><term id="abb15">PCA</term><def><p>principal component analysis</p></def></def-item><def-item><term id="abb16">RMSE</term><def><p>root-mean-square error</p></def></def-item><def-item><term id="abb17">SCI</term><def><p>spinal cord injury</p></def></def-item><def-item><term id="abb18">SCIM-III </term><def><p>Spinal Cord Independence Measure, version III</p></def></def-item><def-item><term id="abb19">SHAP</term><def><p>Shapley additive explanations</p></def></def-item><def-item><term id="abb20">UEMS</term><def><p>Upper Extremity Motor Score</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wade</surname><given-names>DT</given-names> </name></person-group><article-title>Goal setting in rehabilitation: an overview of what, why and how</article-title><source>Clin Rehabil</source><year>2009</year><volume>23</volume><issue>4</issue><fpage>291</fpage><lpage>295</lpage><pub-id pub-id-type="doi">10.1177/0269215509103551</pub-id><pub-id pub-id-type="medline">19293289</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Maribo</surname><given-names>T</given-names> </name><name name-style="western"><surname>Jensen</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Madsen</surname><given-names>LS</given-names> </name><name name-style="western"><surname>Handberg</surname><given-names>C</given-names> </name></person-group><article-title>Experiences with and perspectives on goal setting in spinal cord injury rehabilitation: a systematic review of qualitative studies</article-title><source>Spinal Cord</source><year>2020</year><volume>58</volume><issue>9</issue><fpage>949</fpage><lpage>958</lpage><pub-id pub-id-type="doi">10.1038/s41393-020-0485-8</pub-id><pub-id pub-id-type="medline">32424174</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kirshblum</surname><given-names>S</given-names> </name><name name-style="western"><surname>Snider</surname><given-names>B</given-names> </name><name name-style="western"><surname>Eren</surname><given-names>F</given-names> </name><name name-style="western"><surname>Guest</surname><given-names>J</given-names> </name></person-group><article-title>Characterizing natural recovery after traumatic spinal cord Injury</article-title><source>J Neurotrauma</source><year>2021</year><volume>38</volume><issue>9</issue><fpage>1267</fpage><lpage>1284</lpage><pub-id pub-id-type="doi">10.1089/neu.2020.7473</pub-id><pub-id pub-id-type="medline">33339474</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Boyles</surname><given-names>RH</given-names> </name><name name-style="western"><surname>Alexander</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Belsi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Strutton</surname><given-names>PH</given-names> </name></person-group><article-title>Are clinical prediction rules used in spinal cord injury care? A survey of practice</article-title><source>Top Spinal Cord Inj Rehabil</source><year>2024</year><volume>30</volume><issue>1</issue><fpage>45</fpage><lpage>58</lpage><pub-id pub-id-type="doi">10.46292/sci23-00069</pub-id><pub-id pub-id-type="medline">38433737</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wilson</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Cadotte</surname><given-names>DW</given-names> </name><name name-style="western"><surname>Fehlings</surname><given-names>MG</given-names> </name></person-group><article-title>Clinical predictors of neurological outcome, functional status, and survival after traumatic spinal cord injury: a systematic review</article-title><source>SPI</source><year>2012</year><volume>17</volume><issue>Suppl1</issue><fpage>11</fpage><lpage>26</lpage><pub-id pub-id-type="doi">10.3171/2012.4.AOSPINE1245</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hicks</surname><given-names>KE</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Fallah</surname><given-names>N</given-names> </name><etal/></person-group><article-title>A simplified clinical prediction rule for prognosticating independent walking after spinal cord injury</article-title><source>Spine J</source><year>2017</year><volume>17</volume><issue>10</issue><fpage>1383</fpage><lpage>1392</lpage><pub-id pub-id-type="doi">10.1016/j.spinee.2017.05.031</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van Middendorp</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Hosman</surname><given-names>AJF</given-names> </name><name name-style="western"><surname>Donders</surname><given-names>ART</given-names> </name><etal/></person-group><article-title>A clinical prediction rule for ambulation outcomes after traumatic spinal cord injury: a longitudinal cohort study</article-title><source>Lancet</source><year>2011</year><volume>377</volume><issue>9770</issue><fpage>1004</fpage><lpage>1010</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(10)62276-3</pub-id><pub-id pub-id-type="medline">21377202</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hori</surname><given-names>T</given-names> </name><name name-style="western"><surname>Imura</surname><given-names>T</given-names> </name><name name-style="western"><surname>Tanaka</surname><given-names>R</given-names> </name></person-group><article-title>Development of a clinical prediction rule for patients with cervical spinal cord injury who have difficulty in obtaining independent living</article-title><source>Spine J</source><year>2022</year><volume>22</volume><issue>2</issue><fpage>321</fpage><lpage>328</lpage><pub-id pub-id-type="doi">10.1016/j.spinee.2021.08.010</pub-id><pub-id pub-id-type="medline">34487911</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sperling</surname><given-names>J</given-names> </name><name name-style="western"><surname>Welsh</surname><given-names>W</given-names> </name><name name-style="western"><surname>Haseley</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Machine learning-based prediction models in medical decision-making in kidney disease: patient, caregiver, and clinician perspectives on trust and appropriate use</article-title><source>J Am Med Inform Assoc</source><year>2025</year><volume>32</volume><issue>1</issue><fpage>51</fpage><lpage>62</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocae255</pub-id><pub-id pub-id-type="medline">39545362</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arora</surname><given-names>M</given-names> </name><name name-style="western"><surname>Craig</surname><given-names>AR</given-names> </name></person-group><article-title>Special issue-spinal cord injuries: advances in rehabilitation</article-title><source>J Clin Med</source><year>2024</year><volume>13</volume><issue>6</issue><fpage>1782</fpage><pub-id pub-id-type="doi">10.3390/jcm13061782</pub-id><pub-id pub-id-type="medline">38542004</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mahanes</surname><given-names>D</given-names> </name><name name-style="western"><surname>Muehlschlegel</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wartenberg</surname><given-names>KE</given-names> </name><etal/></person-group><article-title>Guidelines for neuroprognostication in adults with traumatic spinal cord injury</article-title><source>Neurocrit Care</source><year>2024</year><volume>40</volume><issue>2</issue><fpage>415</fpage><lpage>437</lpage><pub-id pub-id-type="doi">10.1007/s12028-023-01845-8</pub-id><pub-id pub-id-type="medline">37957419</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Scivoletto</surname><given-names>G</given-names> </name><name name-style="western"><surname>Tamburella</surname><given-names>F</given-names> </name><name name-style="western"><surname>Laurenza</surname><given-names>L</given-names> </name><name name-style="western"><surname>Torre</surname><given-names>M</given-names> </name><name name-style="western"><surname>Molinari</surname><given-names>M</given-names> </name></person-group><article-title>Who is going to walk? A review of the factors influencing walking recovery after spinal cord injury</article-title><source>Front Hum Neurosci</source><year>2014</year><volume>8</volume><fpage>141</fpage><pub-id pub-id-type="doi">10.3389/fnhum.2014.00141</pub-id><pub-id pub-id-type="medline">24659962</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Quinza&#x00F1;os-Fresnedo</surname><given-names>J</given-names> </name><name name-style="western"><surname>Fratini-Escobar</surname><given-names>PC</given-names> </name><name name-style="western"><surname>Almaguer-Benavides</surname><given-names>KM</given-names> </name><etal/></person-group><article-title>Prognostic validity of a clinical trunk control test for independence and walking in individuals with spinal cord injury</article-title><source>J Spinal Cord Med</source><year>2020</year><volume>43</volume><issue>3</issue><fpage>331</fpage><lpage>338</lpage><pub-id pub-id-type="doi">10.1080/10790268.2018.1518124</pub-id><pub-id pub-id-type="medline">30207875</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>H&#x00E5;kansson</surname><given-names>S</given-names> </name><name name-style="western"><surname>Tuci</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bolliger</surname><given-names>M</given-names> </name><name name-style="western"><surname>Curt</surname><given-names>A</given-names> </name><name name-style="western"><surname>Jutzeler</surname><given-names>CR</given-names> </name><name name-style="western"><surname>Br&#x00FC;ningk</surname><given-names>SC</given-names> </name></person-group><article-title>Data-driven prediction of spinal cord injury recovery: an exploration of current status and future perspectives</article-title><source>Exp Neurol</source><year>2024</year><volume>380</volume><fpage>114913</fpage><pub-id pub-id-type="doi">10.1016/j.expneurol.2024.114913</pub-id><pub-id pub-id-type="medline">39097073</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sharif</surname><given-names>S</given-names> </name><name name-style="western"><surname>Jazaib Ali</surname><given-names>MY</given-names> </name></person-group><article-title>Outcome prediction in spinal cord injury: myth or reality</article-title><source>World Neurosurg</source><year>2020</year><volume>140</volume><fpage>574</fpage><lpage>590</lpage><pub-id pub-id-type="doi">10.1016/j.wneu.2020.05.043</pub-id><pub-id pub-id-type="medline">32437998</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Catz</surname><given-names>A</given-names> </name><name name-style="western"><surname>Itzkovich</surname><given-names>M</given-names> </name><name name-style="western"><surname>Tesio</surname><given-names>L</given-names> </name><etal/></person-group><article-title>A multicenter international study on the Spinal Cord Independence Measure, version III (SCIM III)</article-title><source>Disabil Rehabil</source><year>2007</year><volume>29</volume><issue>24</issue><fpage>1926</fpage><lpage>1933</lpage><pub-id pub-id-type="doi">10.1080/09638280601055052</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Rasmussen</surname><given-names>CE</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>CKI</given-names> </name></person-group><source>Gaussian Processes for Machine Learning</source><year>2006</year><publisher-name>MIT Press</publisher-name><pub-id pub-id-type="doi">10.7551/mitpress/3206.001.0001</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>P&#x00E9;rez-Sanpablo</surname><given-names>AI</given-names> </name><name name-style="western"><surname>Quinza&#x00F1;os-Fresnedo</surname><given-names>J</given-names> </name><name name-style="western"><surname>Romero-Ixtla</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Validation of inertial measurement units for the assessment of trunk control in subjects with spinal cord injury</article-title><source>J Spinal Cord Med</source><year>2023</year><volume>46</volume><issue>1</issue><fpage>154</fpage><lpage>163</lpage><pub-id pub-id-type="doi">10.1080/10790268.2021.1975083</pub-id><pub-id pub-id-type="medline">34612796</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>AlHuthaifi</surname><given-names>F</given-names> </name><name name-style="western"><surname>Krzak</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hanke</surname><given-names>T</given-names> </name><name name-style="western"><surname>Vogel</surname><given-names>LC</given-names> </name></person-group><article-title>Predictors of functional outcomes in adults with traumatic spinal cord injury following inpatient rehabilitation: a systematic review</article-title><source>J Spinal Cord Med</source><year>2017</year><volume>40</volume><issue>3</issue><fpage>282</fpage><lpage>294</lpage><pub-id pub-id-type="doi">10.1080/10790268.2016.1238184</pub-id><pub-id pub-id-type="medline">27852160</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="web"><article-title>Instituto Nacional de Rehabilitaci&#x00F3;n luis guillermo ibarra ibarra informe de autoevaluaci&#x00F3;n 2024</article-title><source>Instituto Nacional de Rehabilitaci&#x00F3;n</source><year>2024</year><access-date>2026-11-03</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.inr.gob.mx/Descargas/informes/Informe_Autoevaluacion_2024.pdf">https://www.inr.gob.mx/Descargas/informes/Informe_Autoevaluacion_2024.pdf</ext-link></comment></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tsegaye</surname><given-names>B</given-names> </name><name name-style="western"><surname>Snell</surname><given-names>KIE</given-names> </name><name name-style="western"><surname>Archer</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Larger sample sizes are needed when developing a clinical prediction model using machine learning in oncology: methodological systematic review</article-title><source>J Clin Epidemiol</source><year>2025</year><volume>180</volume><fpage>111675</fpage><pub-id pub-id-type="doi">10.1016/j.jclinepi.2025.111675</pub-id><pub-id pub-id-type="medline">39814217</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van Smeden</surname><given-names>M</given-names> </name><name name-style="western"><surname>Moons</surname><given-names>KG</given-names> </name><name name-style="western"><surname>de Groot</surname><given-names>JA</given-names> </name><etal/></person-group><article-title>Sample size for binary logistic prediction models: beyond events per variable criteria</article-title><source>Stat Methods Med Res</source><year>2019</year><volume>28</volume><issue>8</issue><fpage>2455</fpage><lpage>2474</lpage><pub-id pub-id-type="doi">10.1177/0962280218784726</pub-id><pub-id pub-id-type="medline">29966490</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van der Ploeg</surname><given-names>T</given-names> </name><name name-style="western"><surname>Austin</surname><given-names>PC</given-names> </name><name name-style="western"><surname>Steyerberg</surname><given-names>EW</given-names> </name></person-group><article-title>Modern modelling techniques are data hungry: a simulation study for predicting dichotomous endpoints</article-title><source>BMC Med Res Methodol</source><year>2014</year><volume>14</volume><fpage>137</fpage><pub-id pub-id-type="doi">10.1186/1471-2288-14-137</pub-id><pub-id pub-id-type="medline">25532820</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Riley</surname><given-names>RD</given-names> </name><name name-style="western"><surname>Snell</surname><given-names>KIE</given-names> </name><name name-style="western"><surname>Ensor</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Minimum sample size for developing a multivariable prediction model: part I - continuous outcomes</article-title><source>Stat Med</source><year>2019</year><volume>38</volume><issue>7</issue><fpage>1262</fpage><lpage>1275</lpage><pub-id pub-id-type="doi">10.1002/sim.7993</pub-id><pub-id pub-id-type="medline">30347470</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goldenholz</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>H</given-names> </name><name name-style="western"><surname>Ganglberger</surname><given-names>W</given-names> </name><name name-style="western"><surname>Westover</surname><given-names>MB</given-names> </name></person-group><article-title>Sample size analysis for machine learning clinical validation studies</article-title><source>Biomedicines</source><year>2023</year><volume>11</volume><issue>3</issue><fpage>685</fpage><pub-id pub-id-type="doi">10.3390/biomedicines11030685</pub-id><pub-id pub-id-type="medline">36979665</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zantvoort</surname><given-names>K</given-names> </name><name name-style="western"><surname>Hentati Isacsson</surname><given-names>N</given-names> </name><name name-style="western"><surname>Funk</surname><given-names>B</given-names> </name><name name-style="western"><surname>Kaldo</surname><given-names>V</given-names> </name></person-group><article-title>Dataset size versus homogeneity: a machine learning study on pooling intervention data in e-mental health dropout predictions</article-title><source>Digit Health</source><year>2024</year><volume>10</volume><fpage>20552076241248920</fpage><pub-id pub-id-type="doi">10.1177/20552076241248920</pub-id><pub-id pub-id-type="medline">38757087</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ramspek</surname><given-names>CL</given-names> </name><name name-style="western"><surname>Jager</surname><given-names>KJ</given-names> </name><name name-style="western"><surname>Dekker</surname><given-names>FW</given-names> </name><name name-style="western"><surname>Zoccali</surname><given-names>C</given-names> </name><name name-style="western"><surname>van Diepen</surname><given-names>M</given-names> </name></person-group><article-title>External validation of prognostic models: what, why, how, when and where?</article-title><source>Clin Kidney J</source><year>2021</year><volume>14</volume><issue>1</issue><fpage>49</fpage><lpage>58</lpage><pub-id pub-id-type="doi">10.1093/ckj/sfaa188</pub-id><pub-id pub-id-type="medline">33564405</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lundberg</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SI</given-names> </name></person-group><article-title>A unified approach to interpreting model predictions</article-title><source>Adv Neural Inf Process Syst</source><year>2017</year><volume>30</volume><fpage>4765</fpage><lpage>4774</lpage></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="web"><article-title>Norma Oficial Mexicana NOM-012-SSA3-2012, que establece los criterios para la ejecuci&#x00F3;n de proyectos de investigaci&#x00F3;n en seres humanos</article-title><source>Secretar&#x00ED;a de salud</source><year>2013</year><access-date>2026-11-03</access-date><publisher-name>Diario Oficial de la Federaci&#x00F3;n</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.dof.gob.mx/nota_detalle.php?codigo=5284149&#x0026;fecha=04/01/2013">https://www.dof.gob.mx/nota_detalle.php?codigo=5284149&#x0026;fecha=04/01/2013</ext-link></comment></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="web"><source>Estudios Cl&#x00ED;nicos</source><access-date>2026-06-05</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://estudiosclinicos.salud.gob.mx/">https://estudiosclinicos.salud.gob.mx/</ext-link></comment></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yoo</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Koo</surname><given-names>B</given-names> </name><name name-style="western"><surname>Yong</surname><given-names>CW</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>KS</given-names> </name></person-group><article-title>Prediction of gait recovery using machine learning algorithms in patients with spinal cord injury</article-title><source>Medicine (Baltimore)</source><year>2024</year><volume>103</volume><issue>23</issue><fpage>e38286</fpage><pub-id pub-id-type="doi">10.1097/MD.0000000000038286</pub-id><pub-id pub-id-type="medline">38847729</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kaminski</surname><given-names>L</given-names> </name><name name-style="western"><surname>Cordemans</surname><given-names>V</given-names> </name><name name-style="western"><surname>Cernat</surname><given-names>E</given-names> </name><name name-style="western"><surname>M&#x2019;Bra</surname><given-names>KI</given-names> </name><name name-style="western"><surname>Mac-Thiong</surname><given-names>JM</given-names> </name></person-group><article-title>Functional outcome prediction after traumatic spinal cord injury based on acute clinical factors</article-title><source>J Neurotrauma</source><year>2017</year><volume>34</volume><issue>12</issue><fpage>2027</fpage><lpage>2033</lpage><pub-id pub-id-type="doi">10.1089/neu.2016.4955</pub-id><pub-id pub-id-type="medline">28129730</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Facchinello</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Beaus&#x00E9;jour</surname><given-names>M</given-names> </name><name name-style="western"><surname>Richard-Denis</surname><given-names>A</given-names> </name><name name-style="western"><surname>Thompson</surname><given-names>C</given-names> </name><name name-style="western"><surname>Mac-Thiong</surname><given-names>JM</given-names> </name></person-group><article-title>Use of regression tree analysis for predicting the functional outcome after traumatic spinal cord injury</article-title><source>J Neurotrauma</source><year>2021</year><volume>38</volume><issue>9</issue><fpage>1285</fpage><lpage>1291</lpage><pub-id pub-id-type="doi">10.1089/neu.2020.7594</pub-id><pub-id pub-id-type="medline">29065782</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kato</surname><given-names>C</given-names> </name><name name-style="western"><surname>Uemura</surname><given-names>O</given-names> </name><name name-style="western"><surname>Sato</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tsuji</surname><given-names>T</given-names> </name></person-group><article-title>Functional outcome prediction after spinal cord injury using ensemble machine learning</article-title><source>Arch Phys Med Rehabil</source><year>2024</year><volume>105</volume><issue>1</issue><fpage>95</fpage><lpage>100</lpage><pub-id pub-id-type="doi">10.1016/j.apmr.2023.08.011</pub-id><pub-id pub-id-type="medline">37714506</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhong</surname><given-names>L</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Predicting spinal cord injury prognosis using machine learning: systematic review and meta-analysis</article-title><source>JMIR AI</source><year>2025</year><volume>4</volume><fpage>e66233</fpage><pub-id pub-id-type="doi">10.2196/66233</pub-id><pub-id pub-id-type="medline">41348848</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Peer Review Report 1</label><p>Peer review report by Secretar&#x00ED;a de Ciencia, Humanidades, Tecnolog&#x00ED;a e Innovaci&#x00F3;n (SECIHTI, Mexico)</p><media xlink:href="resprot_v15i1e95236_app1.pdf" xlink:title="PDF File, 1485 KB"/></supplementary-material></app-group></back></article>