<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Res Protoc</journal-id><journal-id journal-id-type="publisher-id">ResProt</journal-id><journal-id journal-id-type="index">5</journal-id><journal-title>JMIR Research Protocols</journal-title><abbrev-journal-title>JMIR Res Protoc</abbrev-journal-title><issn pub-type="epub">1929-0748</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v14i1e73040</article-id><article-id pub-id-type="doi">10.2196/73040</article-id><article-categories><subj-group subj-group-type="heading"><subject>Protocol</subject></subj-group></article-categories><title-group><article-title>Evaluating Diversity in Open Photoplethysmography Datasets: Protocol for a Systematic Review</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Penmetcha</surname><given-names>Vedha</given-names></name><degrees>BA</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Rambabu</surname><given-names>Lekaashree</given-names></name><degrees>BSc, MRES, MBChB</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff5">5</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Smith</surname><given-names>Brandon G</given-names></name><degrees>BSc, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff6">6</xref><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mantle</surname><given-names>Orla</given-names></name><degrees>MBBS, MPhil</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff7">7</xref><xref ref-type="aff" rid="aff8">8</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Edmiston</surname><given-names>Thomas</given-names></name><degrees>BChir, MB</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Hobbs</surname><given-names>Laura</given-names></name><degrees>BChir, MB</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff7">7</xref><xref ref-type="aff" rid="aff9">9</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Nagraj</surname><given-names>Shobhana</given-names></name><degrees>MBBS, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff6">6</xref><xref ref-type="aff" rid="aff7">7</xref><xref ref-type="aff" rid="aff10">10</xref><xref ref-type="aff" rid="aff11">11</xref><xref ref-type="aff" rid="aff12">12</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Charlton</surname><given-names>Peter H</given-names></name><degrees>MEng, PhD</degrees><xref ref-type="aff" rid="aff11">11</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Bashford</surname><given-names>Tom</given-names></name><degrees>MBBS, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff6">6</xref><xref ref-type="aff" rid="aff7">7</xref></contrib></contrib-group><aff id="aff1"><institution>International Health Systems Group, Department of Engineering, University of Cambridge</institution><addr-line>Cambridge</addr-line><country>United Kingdom</country></aff><aff id="aff2"><institution>Department of Kinesiology, Wiess School of Natural Sciences, Rice University</institution><addr-line>6360 Main St</addr-line><addr-line>Houston</addr-line><addr-line>TX</addr-line><country>United States</country></aff><aff id="aff3"><institution>Department of Medicine, University of Cambridge</institution><addr-line>Cambridge</addr-line><country>United Kingdom</country></aff><aff id="aff4"><institution>Department of Anaesthesia, Cambridge University Hospitals NHS Foundation Trust</institution><addr-line>Cambridge</addr-line><country>United Kingdom</country></aff><aff id="aff5"><institution>Accelerate Programme for Scientific Discovery, Department of Computer Science and Technology, University of Cambridge</institution><addr-line>Cambridge</addr-line><country>United Kingdom</country></aff><aff id="aff6"><institution>Cambridge Public Health Interdisciplinary Research Centre, University of Cambridge</institution><addr-line>Cambridge</addr-line><country>United Kingdom</country></aff><aff id="aff7"><institution>NIHR Global Health Research Group on Acquired Brain and Spine Injury (ABSI), University of Cambridge</institution><addr-line>Cambridge</addr-line><country>United Kingdom</country></aff><aff id="aff8"><institution>GKT School of Medical Education, King's College London</institution><addr-line>London</addr-line><country>United Kingdom</country></aff><aff id="aff9"><institution>Department of Anaesthesia, East and North Hertfordshire Teaching NHS Trust</institution><addr-line>Stevenage</addr-line><country>United Kingdom</country></aff><aff id="aff10"><institution>East London NHS Foundation Trust</institution><addr-line>London</addr-line><country>United Kingdom</country></aff><aff id="aff11"><institution>Department of Public Health and Primary Care, University of Cambridge</institution><addr-line>Cambridge</addr-line><country>United Kingdom</country></aff><aff id="aff12"><institution>Nuffield Department of Women&#x2019;s and Reproductive Health, University of Oxford</institution><addr-line>Oxford</addr-line><country>United Kingdom</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Schwartz</surname><given-names>Amy</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Laws</surname><given-names>Elinor</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Vedha Penmetcha, BA, Department of Kinesiology, Wiess School of Natural Sciences, Rice University, 6360 Main St, Houston, TX, 77005, United States, 1 9133049350; <email>vp439@cam.ac.uk</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>1</day><month>10</month><year>2025</year></pub-date><volume>14</volume><elocation-id>e73040</elocation-id><history><date date-type="received"><day>28</day><month>02</month><year>2025</year></date><date date-type="rev-recd"><day>21</day><month>07</month><year>2025</year></date><date date-type="accepted"><day>10</day><month>09</month><year>2025</year></date></history><copyright-statement>&#x00A9; Vedha Penmetcha, Lekaashree Rambabu, Brandon G Smith, Orla Mantle, Thomas Edmiston, Laura Hobbs, Shobhana Nagraj, Peter H Charlton, Tom Bashford. Originally published in JMIR Research Protocols (<ext-link ext-link-type="uri" xlink:href="https://www.researchprotocols.org">https://www.researchprotocols.org</ext-link>), 1.10.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.researchprotocols.org">https://www.researchprotocols.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.researchprotocols.org/2025/1/e73040"/><abstract><sec><title>Background</title><p>Photoplethysmography (PPG) is an optical method for measuring blood volume changes in microcirculation through noninvasive photodetection. It has become a widespread and essential clinical tool, used in pulse oximeters and wearable devices. However, technical aspects of PPG make it susceptible to intrinsic bias, with the potential to adversely affect particular patient and consumer populations. Developments in PPG technology, increasingly driven by openly accessible datasets as opposed to de novo experimentation, have the potential to help monitor an array of physiological variables. However, some populations may be underrepresented in PPG datasets. We describe a protocol for a systematic review to assess the biases within open access PPG datasets.</p></sec><sec><title>Objective</title><p>This review aims to evaluate the underlying reporting patterns and structure of openly accessible PPG datasets. We will provide insight into the measured biosignals and demographic variables included in the datasets in the hope of shedding light on what PPG data parameters are being used to develop medical devices. Therefore, we can elucidate current gaps and areas for improvement to reduce bias in medical device development.</p></sec><sec sec-type="methods"><title>Methods</title><p>This review will be reported in accordance with the standard PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) guidelines. We will include primary studies that mention PPG and specifically reference openly accessible datasets since 2000. The datasets must contain physiological parameters such as heart rate, blood pressure, or respiratory rate, as well as the PPG waveform data, collected from humans. Searches will be conducted in literature databases and data repositories, including MedLine OVID, IEEE Xplore, Scopus, and PhysioNet. Studies will be evaluated in accordance with the Standing Together Initiative recommendations, which are urging for health care technologies supported by representative data. Biosignal and demographic variables will be extracted from the PPG datasets, with steps taken to harmonize and store this information. Statistical analysis will be performed, including descriptive statistics and the chi-square test for comparisons. Additional statistical analyses will be performed after data extraction is completed and the level of heterogeneity is characterized.</p></sec><sec sec-type="results"><title>Results</title><p>We will analyze the dataset diversity and the structural basis of PPG datasets. This includes statistically analyzing the demographic and biosignal variables in the datasets. By using statistical test fit for nominal variable comparisons, we will evaluate the frequencies of characteristics like the devices used, biosignals collected, clinical parameters, demographic characteristics, and geographic information. This systematic review is expected to be completed by September 2025. The screening and review of the articles is currently being conducted.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This review will provide insight into the potential gaps of existing open access PPG datasets. It will inform future data collection and design of openly available PPG datasets for training medical devices, including wearables, to avoid perpetuating biases, allowing for application in diverse clinical settings.</p></sec><sec><title>Trial Registration</title><p>PROSPERO CRD42024564759; https://www.crd.york.ac.uk/PROSPERO/view/CRD42024564759</p></sec><sec sec-type="registered-report"><title>International Registered Report Identifier (IRRID)</title><p>PRR1-10.2196/73040</p></sec></abstract><kwd-group><kwd>photoplethysmography</kwd><kwd>PPG</kwd><kwd>open data</kwd><kwd>diversity</kwd><kwd>skin tone</kwd><kwd>bias</kwd><kwd>equity</kwd><kwd>fairness</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Photoplethysmography (PPG) is an optical method for measuring blood volume changes in microcirculation, through noninvasive photodetection. It has become a widespread and essential tool, providing the sensing technology for pulse oximeters in clinical use and being widely used in consumer wearables such as smartwatches for heart rate monitoring. However, technical aspects of PPG make it susceptible to intrinsic bias, with the potential to adversely affect particular patient and consumer populations. Developments in PPG technology, increasingly driven by existing datasets as opposed to de novo experimentation, have the potential to help monitor an array of physiological variables with both clinical and wellness applications. However, these may disenfranchise those populations who are underrepresented in the existing training datasets.</p><p>PPG waveforms depict blood volume changes due to changes in absorption and reflection patterns detected by the photodetector [<xref ref-type="bibr" rid="ref1">1</xref>]. PPG measurements are usually obtained by placing the device on the extremities of the body where the vascular bed is shallow and widespread [<xref ref-type="bibr" rid="ref2">2</xref>]. These locations can include the wrist, fingers, toes, and ears. Through signal processing, and in some cases the use of different wavelengths of light, PPG can provide information on respiratory rate, blood pressure, sleep patterns, arterial stiffness, and blood oxygen saturation [<xref ref-type="bibr" rid="ref3">3</xref>]. In addition, the periodicity of electrocardiogram and PPG waves can be correlated in terms of heart rate variability and arrhythmias, as the waveforms correlate to specific points within the cardiac cycle [<xref ref-type="bibr" rid="ref4">4</xref>].</p><p>The 2 primary components of a PPG waveform consist of the pulsatile and the lower frequency portions. The pulsatile component directly correlates to the volumetric changes associated with the heart rate [<xref ref-type="bibr" rid="ref5">5</xref>]. The lower frequency component, on the other hand, consists of the light absorbed by the tissue, veins, and blood, which correlates to volume capacity [<xref ref-type="bibr" rid="ref5">5</xref>]. The optical measurements are usually taken at red or near-infrared wavelengths (625 nm-750 nm and 750 nm-1400 nm) or green wavelengths (500&#x2010;565 nm) [<xref ref-type="bibr" rid="ref6">6</xref>]. These are commonly used because the red or near-infrared wavelengths penetrate up to 2 cm beyond the skin surface whereas the green penetrates up to 0.3 mm and allows for the differentiation between oxyhemoglobin and deoxyhemoglobin [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. However, some PPG methods include the use of multiple wavelengths, including blue, green, and yellow light to improve the signal-to-noise ratio [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>].</p><p>PPG, along with pulse oximetry, has limitations attributed to motion, ambient light, sensor contact, pulse pressure reduction, and disturbances in contact between the sensor and the skin. One key limitation that has recently been highlighted is that of inaccuracy across different skin tones [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. Sjoding et al recently reported that black patients had almost 3 times the frequency of occult hypoxia&#x2013;falsely elevated oxygen saturation levels&#x2013;compared to their white counterparts [<xref ref-type="bibr" rid="ref14">14</xref>]. Occult hypoxia can lead to higher risk of mortality and organ failure for darker-skinned patients and has been shown to reduce the provision of life-saving treatment modalities like supplemental oxygen and medications. This is clearly of concern, both due to the limitations of clinical devices but also the biases inherent in commercial health technology which systematically underserve select populations. The reduced performance of PPG-based technology on darker-skin-toned and obese patients necessitates further inclusion of demographic characteristics like skin tone, race or ethnicity, and even BMI in PPG datasets used to train medical devices, like pulse oximeters. Furthermore, as continuous clinical monitoring and the availability of wearable technology increases globally without correctional strategies, these biases will only worsen the performance of medical devices on diverse populations.</p><p>While the original experiments in pulse oximetry involved permissive hypoxia of test subjects, a number of current PPG developments are largely driven by training on available datasets. However, the biases within openly available datasets have not been described. This makes it difficult to understand their possible impact on both clinical and consumer technology. We describe a protocol for the first systematic review of which we are aware designed to assess the biases within currently open access PPG datasets. This has immediate value for those seeking to derive physiological data from PPG technology using training datasets. By focusing on openly accessible datasets and repositories, we will provide insight into the demographic characteristics of the data that is commonly used for a majority of existing PPG technology including wearables.</p><p>This review aims to evaluate the underlying reporting patterns and structure of openly accessible PPG datasets. We will provide insight into the measured biosignal and demographic variables included in datasets in hopes of shedding light on what PPG data parameters are being used to develop medical devices.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>This review will be reported in accordance with the standard PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) guidelines. The study has been registered with PROSPERO (CRD42024564759) [<xref ref-type="bibr" rid="ref15">15</xref>] before the initial literature search [<xref ref-type="bibr" rid="ref16">16</xref>]. The full planned search strategy is provided in the Supplementary Material in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, which has been developed in close concordance with a medical librarian (IK and EE). This search strategy includes the databases and data repositories: MedLine OVID, IEEE, SCOPUS, Physionet, National Sleep Research Resource, UC Irvine Machine Learning Repository, and Borealis.</p></sec><sec id="s2-2"><title>Eligibility Criteria</title><p>We will include any peer-reviewed primary studies&#x2014;observational and nonobservational&#x2014;which use PPG datasets. This includes PPG datasets in published randomized controlled trials, nonrandomized trials, cross-sectional studies, cohort studies, and algorithmic models.</p><p>We will include studies published since 2000 to ensure the datasets are relevant to current technology developments. The year of 2000 was defined as the lower bound to ensure the datasets selected for analysis are aligned with contemporary medical device design, especially since there has been a rise in usage of PPG datasets to train wearable health technologies in the last 2 decades. In the early 2000s, significant global health milestones like the Millennium Development Goals were established, marking a period in time when critical frameworks and health care initiatives for promoting greater equity and diversity were implemented. We plan to include studies that mention PPG and specifically reference openly accessible datasets. Therefore, accounts will be created to access datasets as needed; however, any datasets that require a fee or monetary incentive to access the datasets will be deemed as not openly accessible. The datasets must contain physiological parameters such as heart rate, blood pressure, or respiratory rate as well as data describing the waveform, such as pulse wave or slope transit time. These terms have been chosen as they are indicators of parameters routinely collected in PPG datasets. The inclusion and exclusion criteria are outlined in <xref ref-type="other" rid="box1">Textbox 1</xref>. Included studies will be evaluated for the extent to which they include demographic characteristics and consider these characteristics.</p><boxed-text id="box1"><title> Summary of inclusion and exclusion criteria.</title><p>Inclusion criteria</p><list list-type="bullet"><list-item><p>Openly accessible datasets</p></list-item><list-item><p>Literature containing datasets years 2000-present</p></list-item><list-item><p>Must contain photoplethysmography (PPG) signal and physiological parameters such as heart rate, blood pressure, or respiratory rate</p></list-item><list-item><p>Human studies</p></list-item><list-item><p>English and non-English articles, provided the non-English articles have datasets with English translation</p></list-item></list><p>Exclusion criteria</p><list list-type="bullet"><list-item><p>Animal studies</p></list-item><list-item><p>Lack of PPG signals</p></list-item><list-item><p>Primary literature without reference to datasets</p></list-item><list-item><p>Conference papers and abstracts</p></list-item></list></boxed-text><p>Datasets meeting the eligibility criteria will be included for analysis of demographic characteristics. Articles mentioning openly accessible datasets may be used to provide contextual information on the datasets, but only the datasets will be analyzed to ensure the primary objective of this review is focused on the reporting quality of openly accessible PPG datasets.</p></sec><sec id="s2-3"><title>Data Analysis</title><p>Following the initial literature search, all studies will be reviewed independently by two authors using systematic review software, Rayyan.ai [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Studies will initially be screened by title and abstract. The full-text articles will then undergo screening. Disagreements will be discussed with and resolved by a third author, a senior author with expertise in the topic. At each step, studies will be retrieved only if they meet the eligibility criteria.</p><sec id="s2-3-1"><title>Information Sources</title><p>Databases including Medline OVID, IEEE Xplore, and Scopus have been searched for articles including relevant datasets or mentionings of dataset repositories. The latest search was completed in December 2024. Following this literature search, specific dataset repositories including Physionet and GitHub will be searched to provide any additional openly accessible datasets relevant to the eligibility criteria and aim of the systematic review.</p></sec><sec id="s2-3-2"><title>Risk of Bias</title><p>The studies will be assessed using the STANDING Together Initiative guidelines as a framework for evaluating the datasets, as there are no widely accepted tools for assessing the risk of bias of datasets [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. The STANDING Together Initiative provides guidelines that address dataset diversity and inclusion to improve the transparency of dataset reporting [<xref ref-type="bibr" rid="ref19">19</xref>]. Though these recommendations do not make up a definitive risk of bias tool, they provide content areas for analyzing the datasets, as they promote greater transparency in the reporting of datasets used for training and developing medical devices.</p></sec><sec id="s2-3-3"><title>Synthesis of Results</title><p>After dataset extraction, a systematic analysis and summary of all included studies and datasets will be provided by describing their dataset characteristics and study outcomes. Due to the heterogeneity of the datasets included, the statistical analysis and summary will provide an overview of the current state of openly accessible PPG datasets and repositories. Details such as the devices, biosignals collected, clinical parameters (sample size), demographic characteristics (age, sex, race or ethnicity, skin tone, and BMI), and geographical information (country, health care setting, and dates) will provide insight into the dataset characteristics. We expect the need for stepwise data harmonization where variables included in the datasets will be extracted, compared, and stored in a CSV file format with standardized labeling. The analysis of the biosignal and demographic variables will be analyzed in R to allow for the creation of data visualizations and provide statistical comparisons of the variables included across the datasets. Quantitative analysis will allow this review to focus on the frequencies and counts of the measured biosignal and demographic data variables. This information will provide insight into the reporting quality of the datasets; however, the specific values or information collected within the dataset for each biosignal and demographic variable will not be analyzed, to ensure a broader understanding of dataset documentation.</p><p>Summary statistics will be provided based on the characteristics of the datasets. These will include descriptive statistics such as means, SD, and data visualizations depicting the distribution of demographic and geographical characteristics. Statistical analysis will be performed on the dataset characteristics, such as age, sex, race, ethnicity, skin tone, BMI, and other relevant parameters, including analysis on the frequency of the variables and other quantitative aspects extracted from the studies [<xref ref-type="bibr" rid="ref21">21</xref>]. Raw counts of the characteristics will be visualized as percentages or proportions to depict the array of demographic variables reported in the PPG datasets. These characteristics will also be analyzed using statistical tests such as chi-square for frequency and independence [<xref ref-type="bibr" rid="ref14">14</xref>]. These tests will provide insight into the differences in both the frequencies and the co-occurrence of demographic characteristics, respectively. Further analysis of the literature will contextualize why such differences may or may not be statistically significant. Visualizations such as histograms will include information on the mean ages, dataset sizes, and number of waveform characteristics reported. This analysis will provide insight into how datasets are structured and the amount of information reported in them to qualify potential reasons for statistically significant differences in dataset reporting. Additional statistical tests will be used, and information such as geographical or socioeconomic data will be displayed cartographically or in a heatmap to depict the geographical sources of PPG studies and datasets.</p></sec></sec><sec id="s2-4"><title>Limitations and Implications</title><p>We predict that there will be heterogeneity in the data reporting quality and the terminology used to signify specific variables; therefore, it is important to use broad inclusion criteria to capture relevant articles.</p><p>We also anticipate significant heterogeneity of demographic characteristics. Jiang et al [<xref ref-type="bibr" rid="ref19">19</xref>] reported that less than seven percent of physiological datasets, specifically those available on PhysioNet, include all 4 key demographic variables&#x2014;age, sex, race, and ethnicity. Consequently, it is important to not include these variables in our inclusion or exclusion criteria to truly understand the level to which PPG datasets consider demographic aspects including variables such as age, sex, race, ethnicity, and other relevant parameters like skin tone or BMI. Understanding the extent to which demographic parameters are collected in PPG datasets will therefore shed light on what information is used in informing the development and deployment of healthcare technology. By collecting information on the structural aspects of the PPG datasets, we will provide a critical comprehension of the reporting quality of openly accessible datasets.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>After the protocol was registered, the literature search was run in the databases IEEE, Scopus, and MedLine OVID in December 2024. The search yielded 1198 articles for initial screening. The openly accessible PPG datasets extracted from these repositories will be included in the analysis of demographic and biosignal data. The abstract screening phase has yielded 464 articles. The full-text screening is projected to be completed by July 2025. After which data analysis, detailed below, will be projected to be completed by September 2025.</p></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>Understanding the reporting quality of datasets used to develop health care technology is becoming increasingly important as the use of algorithmic models and processing to train medical devices grows. By analyzing openly accessible PPG datasets, we aim to provide a more comprehensive view of standard of data collection and usage for medical devices. Because of PPG&#x2019;s long-standing usage in medical devices since the 1970 s and the wide range of biosignals that can be extracted from PPG data, it is vital to increase transparency in the demographic information collected in tangent to the biosignal data. The principal finding from this review will be to extract the different demographic and biosignal characteristics listed in openly accessible PPG datasets. We will provide summary statistics including frequencies, proportions, and distributions of the number and types of dataset characteristics. These summary statistics will be visualized in diagrams like histograms and box-whisker plots as well as tables. Any additional information related to characteristics such as the geographical location of the data collection or socioeconomic status will be portrayed in heatmaps to provide a general overview of additional social variables.</p></sec><sec id="s4-2"><title>Comparison to Previous Work</title><p>Wearables including smartwatches are commonly used to track personal health measures such as heart rate, sleep, and blood pressure. These commercially available medical devices often use PPG to take physiological measurements. However, PPG data collected by wearables have been observed to be affected by skin tone and higher adipose tissue due to obesity [<xref ref-type="bibr" rid="ref12">12</xref>]. In combination, differences of up to 61% in signal intensity have been observed [<xref ref-type="bibr" rid="ref12">12</xref>]. The Fitzpatrick scale is commonly used to assess for differences in skin tone, and while it provides an insight into the physiological signal values caused by greater melanin levels, it is subjective and treats skin tone as a categorical, rather than a continuous, variable [<xref ref-type="bibr" rid="ref22">22</xref>]. This has limitations when considering the many underlying factors that result in the chromatic appearance of an individual&#x2019;s skin tone, particularly if complicated by clinical conditions such as jaundice or hypoxia. Exploring the extent to which variables such as this are captured within existing datasets may be instructive in understanding their inherent ability to account for overall skin coloration.</p><p>Clearly, this same need to account for diversity in skin tone and clinical condition applies to clinical PPG studies and their resultant datasets. In a clinical setting, having erroneous oxygen saturation values or heart rate measurements can result in poorer clinical outcomes. There is evidence that the obese and those with greater melanin content in their skin endure worse health outcomes, with inaccurate monitoring a clear potential contributor [<xref ref-type="bibr" rid="ref22">22</xref>]. Obesity can be attributed to physiological changes such as the reduction in trans-epidermal water loss and an increase in skin thickness due to adipose tissue can influence the light scattering patterns needed to obtain a PPG reading [<xref ref-type="bibr" rid="ref22">22</xref>]. In addition to melanin content and obesity, other factors influencing perfusion and skin temperature can all affect PPG. When expanding PPG technology to low-resource settings, there is a need to account for diverse populations not only in terms of melanation but also factors such as obesity and conditions altering perfusion. Moreover, they may have a greater diversity of endemic clinical conditions including anemia, parasitemia, and malnutrition&#x2014;whose effects on PPG have not been clearly described. Effective clinical PPG monitoring in these patients mandates an interpretation based on data from representative populations.</p><p>This understanding of demographic and biosignal variables is critical to presenting the current standard of reporting quality across openly accessible PPG datasets. In a recent review of PhysioNet datasets, a data repository with biosignal datasets, information regarding demographic and geographical information was presented to highlight the disparities and demographic gaps present in biosignal datasets [<xref ref-type="bibr" rid="ref19">19</xref>]. This marks the analysis of openly accessible PPG datasets relevant and important for promoting transparency and equity in medical device development, as PPG is a widely accepted technology growing in popularity in health care. The aims of this systematic review mirror those of the review by Jiang et al [<xref ref-type="bibr" rid="ref19">19</xref>], but take a broader look at openly accessible PPG datasets across multiple databases and repositories.</p></sec><sec id="s4-3"><title>Strengths and Limitations</title><p>Providing a detailed summary of the demographic and biosignal variables in openly available datasets, we aim to promote a more comprehensive understanding of reporting standards in existing PPG datasets. This review will provide a structured overview of the current gaps and sources of bias in developing PPG-based medical devices. Transparency in dataset reporting will highlight the need for greater diversity and promote an increased range of demographic characteristics collected in openly available PPG datasets. However, we do expect limitations such as heterogeneity in the datasets, especially as it comes to which characteristics are collected and included in the datasets. We also anticipate challenges in gaining access to certain datasets as we will likely have to go through repositories or databases that require account creation or multiple steps in gaining access to the PPG databases. These limitations will be mitigated by maintaining clear documentation of the characteristics extracted from the datasets being analyzed and data harmonization. Also, accounts will be created as needed to ensure adequate access is gained to review the dataset characteristics.</p></sec><sec id="s4-4"><title>Future Directions</title><p>In this systematic review, we will analyze the structural basis of PPG datasets and critically evaluate the different variables included in the datasets. This analysis will highlight the reporting quality of openly accessible PPG datasets. By critically appraising the dataset diversity and reporting quality, we can highlight the gaps present in current PPG data to inform future collection and design of medical devices including wearables to be more inclusive to avoid perpetuating biases. In addition, by looking at the structure of PPG datasets and their representativeness, we can also provide insight into the gaps that may be present in the context of PPG applications in low-resource settings. The findings can promote awareness of sources of bias in openly accessible PPG datasets, informing future data collection and modulation when training PPG-based medical technology. With the synthesis of this information and data analysis, we hope that medical device developers would consider dataset level biases and their implications on human health. We hope that these considerations would push toward greater transparency in PPG data collection and extraction of demographic and biosignal characteristics to ensure users are informed of the design and development of medical devices and avenues for promoting fairness. This review, therefore, aims to address disparities in openly available PPG datasets, the downstream effects of these disparities, and potential avenues for greater equity in PPG dataset creation and usage.</p></sec></sec></body><back><ack><p>We would like to acknowledge the medical librarians Ms Isla Kuhn and Ms Emma Etteridge for their help in developing the search strategy for this systematic review.</p><p>LH, BGS, and TB are funded by the National Institute for Health and Care Research (NIHR; NIHR132455) using UK aid from the UK Government to support global health research; the views expressed in this publication are those of the author(s) and not necessarily those of the NIHR or the UK Government. In addition, TB and BGS have received funding from Abbott, the Wellcome Trust, the Cambridge Biomedical Research Centre, and other NIHR awards. None of these funding sources directly contributed to the preparation of this manuscript. LR is supported by an NIHR Academic Clinical Fellowship. PHC acknowledges funding from the British Heart Foundation (FS/20/20/34626).</p></ack><notes><sec><title>Data Availability</title><p>All data generated or analyzed during this study are included in this published article and its supplementary information files.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: VP (lead), LR (equal), PHC (equal), TB (equal)</p><p>Data curation: VP (lead), LR (equal)</p><p>Formal analysis: VP (lead), LR (equal), PHC (supporting), TB (supporting)</p><p>Funding acquisition: No specific funding has been sourced for this work</p><p>Investigation: VP (lead), LR (equal)</p><p>Methodology: VP (lead), LR (equal), PHC (equal), TB (equal)</p><p>Project administration: TB (lead), PHC (equal)</p><p>Resources: VP (lead), LR (equal), PHC (equal), TB (equal)</p><p>Supervision: TB (lead), PHC (equal), LR (equal)</p><p>Validation: VP (lead), LR (equal), PHC (equal), TB (equal),</p><p>Visualization: VP (lead), LR (equal), BGS (supporting), SN (supporting), PHC (supporting), TB (supporting)</p><p>Writing&#x2013;original draft: VP (lead), LR (equal), PHC (supporting), TB (supporting)</p><p>Writing&#x2013;review &#x0026; editing: VP (lead), LR (equal), PHC (supporting), TB (supporting), BGS (supporting), SN (supporting), OM (supporting), TE (supporting), LH (supporting)</p></fn><fn fn-type="conflict"><p>PHC is employed by Nokia Bell Labs. He has performed consultancy work for Cambridge University Technical Services, has received travel funds from VascAgeNet, and has received honoraria from IOP Publishing and Emory University (the latter not received personally).</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">PPG</term><def><p>Photoplethysmography</p></def></def-item><def-item><term id="abb2">PRISMA</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Castaneda</surname><given-names>D</given-names> </name><name name-style="western"><surname>Esparza</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ghamari</surname><given-names>M</given-names> </name><name name-style="western"><surname>Soltanpur</surname><given-names>C</given-names> </name><name name-style="western"><surname>Nazeran</surname><given-names>H</given-names> </name></person-group><article-title>A review on wearable photoplethysmography sensors and their potential future applications in health care</article-title><source>Int J Biosens Bioelectron</source><year>2018</year><volume>4</volume><issue>4</issue><fpage>195</fpage><lpage>202</lpage><pub-id pub-id-type="doi">10.15406/ijbsbe.2018.04.00125</pub-id><pub-id pub-id-type="medline">30906922</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>J</given-names> </name><name name-style="western"><surname>Seok</surname><given-names>HS</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Shin</surname><given-names>H</given-names> </name></person-group><article-title>Photoplethysmogram analysis and applications: an integrative review</article-title><source>Front Physiol</source><year>2022</year><month>03</month><day>1</day><access-date>2025-09-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/journals/physiology/articles/10.3389/fphys.2021.808451/full">https://www.frontiersin.org/journals/physiology/articles/10.3389/fphys.2021.808451/full</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Almarshad</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Islam</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Al-Ahmadi</surname><given-names>S</given-names> </name><name name-style="western"><surname>BaHammam</surname><given-names>AS</given-names> </name></person-group><article-title>Diagnostic Features and Potential Applications of PPG Signal in Healthcare: A Systematic Review</article-title><source>Healthcare (Basel)</source><year>2022</year><month>03</month><day>16</day><volume>10</volume><issue>3</issue><fpage>547</fpage><pub-id pub-id-type="doi">10.3390/healthcare10030547</pub-id><pub-id pub-id-type="medline">35327025</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Tang</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ward</surname><given-names>R</given-names> </name><name name-style="western"><surname>Menon</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Robust reconstruction of electrocardiogram using photoplethysmography: a subject-based model</article-title><source>Front Physiol</source><year>2025</year><month>04</month><day>25</day><access-date>2025-09-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/journals/physiology/articles/10.3389/fphys.2022.859763/full">https://www.frontiersin.org/journals/physiology/articles/10.3389/fphys.2022.859763/full</ext-link></comment></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Loh</surname><given-names>HW</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Faust</surname><given-names>O</given-names> </name><etal/></person-group><article-title>Application of photoplethysmography signals for healthcare systems: An in-depth review</article-title><source>Comput Methods Programs Biomed</source><year>2022</year><month>04</month><volume>216</volume><fpage>106677</fpage><pub-id pub-id-type="doi">10.1016/j.cmpb.2022.106677</pub-id><pub-id pub-id-type="medline">35139459</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>SH</given-names> </name><name name-style="western"><surname>Chuang</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>CC</given-names> </name></person-group><article-title>Development of a Portable All-Wavelength PPG Sensing Device for Robust Adaptive-Depth Measurement: A Spectrometer Approach with a Hydrostatic Measurement Example</article-title><source>Sensors (Basel)</source><year>2020</year><month>11</month><day>17</day><volume>20</volume><issue>22</issue><fpage>6556</fpage><pub-id pub-id-type="doi">10.3390/s20226556</pub-id><pub-id pub-id-type="medline">33212798</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Feiner</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Severinghaus</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Bickler</surname><given-names>PE</given-names> </name></person-group><article-title>Dark skin decreases the accuracy of pulse oximeters at low oxygen saturation: the effects of oximeter probe type and gender</article-title><source>Anesthesia &#x0026; Analgesia</source><year>2025</year><month>01</month><day>20</day><access-date>2025-09-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://journals.lww.com/anesthesia-analgesia/fulltext/2007/12001/dark_skin_decreases_the_accuracy_of_pulse.4.aspx">https://journals.lww.com/anesthesia-analgesia/fulltext/2007/12001/dark_skin_decreases_the_accuracy_of_pulse.4.aspx</ext-link></comment></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abay</surname><given-names>TY</given-names> </name><name name-style="western"><surname>Kyriacou</surname><given-names>PA</given-names> </name></person-group><article-title>Photoplethysmography for blood volumes and oxygenation changes during intermittent vascular occlusions</article-title><source>J Clin Monit Comput</source><year>2018</year><month>06</month><volume>32</volume><issue>3</issue><fpage>447</fpage><lpage>455</lpage><pub-id pub-id-type="doi">10.1007/s10877-017-0030-2</pub-id><pub-id pub-id-type="medline">28547651</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mo&#x00E7;o</surname><given-names>AV</given-names> </name><name name-style="western"><surname>Stuijk</surname><given-names>S</given-names> </name><name name-style="western"><surname>de Haan</surname><given-names>G</given-names> </name></person-group><article-title>Skin inhomogeneity as a source of error in remote PPG-imaging</article-title><source>Biomed Opt Express</source><year>2016</year><month>11</month><day>1</day><volume>7</volume><issue>11</issue><fpage>4718</fpage><lpage>4733</lpage><pub-id pub-id-type="doi">10.1364/BOE.7.004718</pub-id><pub-id pub-id-type="medline">27896011</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yan</surname><given-names>BPY</given-names> </name><name name-style="western"><surname>Dai</surname><given-names>WX</given-names> </name><name name-style="western"><surname>Ding</surname><given-names>XR</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>YT</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>N</given-names> </name></person-group><article-title>Multi-wavelength photoplethysmography method for skin arterial pulse extraction</article-title><source>Biomed Opt Express</source><year>2016</year><month>10</month><day>1</day><volume>7</volume><issue>10</issue><fpage>4313</fpage><lpage>4326</lpage><pub-id pub-id-type="doi">10.1364/BOE.7.004313</pub-id><pub-id pub-id-type="medline">27867733</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>McMurray</surname><given-names>JP</given-names> </name><name name-style="western"><surname>Branan</surname><given-names>KL</given-names> </name><name name-style="western"><surname>Hsiao</surname><given-names>CT</given-names> </name><name name-style="western"><surname>Idah-Oze</surname><given-names>S</given-names> </name><name name-style="western"><surname>Thrailkill</surname><given-names>A</given-names> </name><name name-style="western"><surname>Cot&#x00E9;</surname><given-names>GL</given-names> </name></person-group><article-title>Multiwavelength photoplethysmography signal analysis as a function of varied wrist contact pressure</article-title><conf-name>Optical Diagnostics and Sensing XXIII: Toward Point-of-Care Diagnostics</conf-name><conf-date>Jan 20, 2023</conf-date><conf-loc>San Francisco, United States</conf-loc><fpage>31</fpage><lpage>35</lpage><pub-id pub-id-type="doi">10.1117/12.2649531</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="web"><article-title>Monte carlo analysis of optical heart rate sensors in commercial wearables: the effect of skin tone and obesity on the photoplethysmography (PPG) signal</article-title><source>Biomed Opt Express</source><year>2021</year><month>11</month><day>10</day><access-date>2025-09-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://opg.optica.org/boe/fulltext.cfm?uri=boe-12-12-7445&#x0026;id=464758">https://opg.optica.org/boe/fulltext.cfm?uri=boe-12-12-7445&#x0026;id=464758</ext-link></comment></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sjoding</surname><given-names>MW</given-names> </name><name name-style="western"><surname>Dickson</surname><given-names>RP</given-names> </name><name name-style="western"><surname>Iwashyna</surname><given-names>TJ</given-names> </name><name name-style="western"><surname>Gay</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Valley</surname><given-names>TS</given-names> </name></person-group><article-title>Racial Bias in Pulse Oximetry Measurement</article-title><source>N Engl J Med</source><year>2020</year><month>12</month><day>17</day><volume>383</volume><issue>25</issue><fpage>2477</fpage><lpage>2478</lpage><pub-id pub-id-type="doi">10.1056/NEJMc2029240</pub-id><pub-id pub-id-type="medline">33326721</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Sjoding</surname><given-names>MW</given-names> </name><name name-style="western"><surname>Dickson</surname><given-names>RP</given-names> </name><name name-style="western"><surname>Iwashyna</surname><given-names>TJ</given-names> </name><name name-style="western"><surname>Gay</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Valley</surname><given-names>TS</given-names> </name></person-group><article-title>Racial bias in pulse oximetry measurement</article-title><source>N Engl J Med</source><year>2025</year><month>12</month><day>17</day><access-date>2025-09-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www-nejm-org.laneproxy.stanford.edu/doi/full/10.1056/NEJMc2029240">https://www-nejm-org.laneproxy.stanford.edu/doi/full/10.1056/NEJMc2029240</ext-link></comment></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="web"><article-title>PROSPERO home page</article-title><source>National Institute for Health and Care Research</source><access-date>2025-09-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.crd.york.ac.uk/prospero/">https://www.crd.york.ac.uk/prospero/</ext-link></comment></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Penmetcha</surname><given-names>V</given-names> </name><name name-style="western"><surname>Rambabu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Smith</surname><given-names>B</given-names> </name><name name-style="western"><surname>Bashford</surname><given-names>T</given-names> </name><name name-style="western"><surname>Charlton</surname><given-names>P</given-names> </name></person-group><article-title>Evaluating the characteristics of open access photoplethysmography datasets</article-title><source>PROSPERO</source><year>2024</year><access-date>2025-09-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.crd.york.ac.uk/PROSPERO/view/CRD42024564759">https://www.crd.york.ac.uk/PROSPERO/view/CRD42024564759</ext-link></comment></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ouzzani</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hammady</surname><given-names>H</given-names> </name><name name-style="western"><surname>Fedorowicz</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Elmagarmid</surname><given-names>A</given-names> </name></person-group><article-title>Rayyan-a web and mobile app for systematic reviews</article-title><source>Syst Rev</source><year>2016</year><month>12</month><day>5</day><volume>5</volume><issue>1</issue><fpage>210</fpage><pub-id pub-id-type="doi">10.1186/s13643-016-0384-4</pub-id><pub-id pub-id-type="medline">27919275</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="web"><source>Rayyan</source><access-date>2025-09-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.rayyan.ai/">https://www.rayyan.ai/</ext-link></comment></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jiang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ashar</surname><given-names>P</given-names> </name><name name-style="western"><surname>Shandhi</surname><given-names>MMH</given-names> </name><name name-style="western"><surname>Dunn</surname><given-names>J</given-names> </name></person-group><article-title>Demographic reporting in biosignal datasets: a comprehensive analysis of the PhysioNet open access database</article-title><source>Lancet Digit Health</source><year>2024</year><month>11</month><volume>6</volume><issue>11</issue><fpage>e871</fpage><lpage>e878</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(24)00170-5</pub-id><pub-id pub-id-type="medline">39358064</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alderman</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Palmer</surname><given-names>J</given-names> </name><name name-style="western"><surname>Laws</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Tackling algorithmic bias and promoting transparency in health datasets: the STANDING Together consensus recommendations</article-title><source>Lancet Digit Health</source><year>2025</year><month>01</month><volume>7</volume><issue>1</issue><fpage>e64</fpage><lpage>e88</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(24)00224-3</pub-id><pub-id pub-id-type="medline">39701919</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alderman</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Charalambides</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sachdeva</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Revealing transparency gaps in publicly available COVID-19 datasets used for medical artificial intelligence development-a systematic review</article-title><source>Lancet Digit Health</source><year>2024</year><month>11</month><volume>6</volume><issue>11</issue><fpage>e827</fpage><lpage>e847</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(24)00146-8</pub-id><pub-id pub-id-type="medline">39455195</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="web"><article-title>Wound care and skin tone: signs, symptoms and terminology for all skin tones</article-title><source>Wounds Asia</source><year>2025</year><month>01</month><day>20</day><access-date>2025-09-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://woundsasia.com/journal-articles/wound-care-and-skin-tone-signs-symptoms-and-terminology-for-all-skin-tones/">https://woundsasia.com/journal-articles/wound-care-and-skin-tone-signs-symptoms-and-terminology-for-all-skin-tones/</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Search strategy.</p><media xlink:href="resprot_v14i1e73040_app1.docx" xlink:title="DOCX File, 14 KB"/></supplementary-material><supplementary-material id="app2"><label>Checklist 1</label><p>PRISMA-P checklist.</p><media xlink:href="resprot_v14i1e73040_app2.pdf" xlink:title="PDF File, 220 KB"/></supplementary-material></app-group></back></article>