<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Digit. Health</journal-id>
<journal-title>Frontiers in Digital Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Digit. Health</abbrev-journal-title>
<issn pub-type="epub">2673-253X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fdgth.2025.1534830</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Digital Health</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>An AI-based module for interstitial glucose forecasting enabling a &#x201C;Do-It-Yourself&#x201D; application for people with type 1 diabetes</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes"><name><surname>Rodriguez-Almeida</surname><given-names>Antonio J.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2905562/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/software/"/></contrib>
<contrib contrib-type="author"><name><surname>Socorro-Marrero</surname><given-names>Guillermo V.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/></contrib>
<contrib contrib-type="author"><name><surname>Betancort</surname><given-names>Carmelo</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/visualization/"/></contrib>
<contrib contrib-type="author"><name><surname>Zamora-Zamorano</surname><given-names>Garlene</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/visualization/"/></contrib>
<contrib contrib-type="author"><name><surname>Deniz-Garcia</surname><given-names>Alejandro</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/visualization/"/></contrib>
<contrib contrib-type="author"><name><surname>&#x00C1;lvarez-Mal&#x00E9;</surname><given-names>Mar&#x00ED;a L.</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/visualization/"/></contrib>
<contrib contrib-type="author"><name><surname>&#x00C5;rsand</surname><given-names>Eirik</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/></contrib>
<contrib contrib-type="author"><name><surname>Soguero-Ruiz</surname><given-names>Cristina</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/></contrib>
<contrib contrib-type="author"><name><surname>W&#x00E4;gner</surname><given-names>Ana M.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/851453/overview"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/></contrib>
<contrib contrib-type="author"><name><surname>Granja</surname><given-names>Concei&#x00E7;&#x00E3;o</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/></contrib>
<contrib contrib-type="author"><name><surname>Callico</surname><given-names>Gustavo M.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/><role content-type="https://credit.niso.org/contributor-roles/supervision/"/><role content-type="https://credit.niso.org/contributor-roles/resources/"/></contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Fabelo</surname><given-names>Himar</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
<xref ref-type="aff" rid="aff9"><sup>9</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref><uri xlink:href="https://loop.frontiersin.org/people/2373056/overview" /><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/><role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/><role content-type="https://credit.niso.org/contributor-roles/supervision/"/></contrib>
</contrib-group>
<aff id="aff1"><label><sup>1</sup></label><institution>Institute for Applied Microelectronics, University of Las Palmas de Gran Canaria, ULPGC</institution>, <addr-line>Las Palmas de Gran Canaria</addr-line>, <country>Spain</country></aff>
<aff id="aff2"><label><sup>2</sup></label><institution>Endocrinology and Nutrition Department, Complejo Hospitalario Universitario Insular Materno-Infantil, CHUIMI</institution>, <addr-line>Las Palmas de Gran Canaria</addr-line>, <country>Spain</country></aff>
<aff id="aff3"><label><sup>3</sup></label><institution>Instituto de Investigaciones Biom&#x00E9;dicas y Sanitarias, University of de Las Palmas de Gran Canaria, ULPGC</institution>, <addr-line>Las Palmas de Gran Canaria</addr-line>, <country>Spain</country></aff>
<aff id="aff4"><label><sup>4</sup></label><institution>Department of Computer Science, University of Troms&#x00F8;&#x2014;The Arctic University of Norway</institution>, <addr-line>Troms&#x00F8;</addr-line>, <country>Norway</country></aff>
<aff id="aff5"><label><sup>5</sup></label><institution>Norwegian Centre for E-health Research, University Hospital of North-Norway, UNN</institution>, <addr-line>Troms&#x00F8;</addr-line>, <country>Norway</country></aff>
<aff id="aff6"><label><sup>6</sup></label><institution>Department of Signal Theory and Communications, Telematics and Computing Systems, Rey Juan Carlos University, URJC</institution>, <addr-line>Fuenlabrada</addr-line>, <country>Spain</country></aff>
<aff id="aff7"><label><sup>7</sup></label><institution>Faculty of Nursing and Health Sciences, Nord University, NU</institution>, <addr-line>Bod&#x00F8;</addr-line>, <country>Norway</country></aff>
<aff id="aff8"><label><sup>8</sup></label><institution>Fundaci&#x00F3;n Canaria Instituto de Investigaci&#x00F3;n Sanitaria de Canarias, FIISC</institution>, <addr-line>Las Palmas de Gran Canaria</addr-line>, <country>Spain</country></aff>
<aff id="aff9"><label><sup>9</sup></label><institution>Research Unit, Hospital Universitario de Gran Canaria Dr. Negrin</institution>, <addr-line>Las Palmas de Gran Canaria</addr-line>, <country>Spain</country></aff>
<author-notes>
<fn fn-type="edited-by"><p><bold>Edited by:</bold> Gururaj H. L., Manipal Institute of Technology, India</p></fn>
<fn fn-type="edited-by"><p><bold>Reviewed by:</bold> Hong Lin, University of Houston&#x2013;Downtown, United States</p>
<p>Nicolas Medrano, University of Zaragoza, Spain</p></fn>
<corresp id="cor1"><label>&#x002A;</label><bold>Correspondence:</bold> Antonio J. Rodr&#x00ED;guez-Almeida <email>aralmeida@iuma.ulpgc.es</email> Himar Fabelo <email>hfabelo@iuma.ulpgc.es</email></corresp>
</author-notes>
<pub-date pub-type="epub"><day>13</day><month>06</month><year>2025</year></pub-date>
<pub-date pub-type="collection"><year>2025</year></pub-date>
<volume>7</volume><elocation-id>1534830</elocation-id>
<history>
<date date-type="received"><day>26</day><month>11</month><year>2024</year></date>
<date date-type="accepted"><day>19</day><month>05</month><year>2025</year></date>
</history>
<permissions>
<copyright-statement>&#x00A9; 2025 Rodriguez-Almeida, Socorro-Marrero, Betancort, Zamora-Zamorano, Deniz-Garcia, &#x00C1;lvarez-Mal&#x00E9;, &#x00C5;rsand, Soguero-Ruiz, W&#x00E4;gner, Granja, Callico and Fabelo.</copyright-statement>
<copyright-year>2025</copyright-year><copyright-holder>Rodriguez-Almeida, Socorro-Marrero, Betancort, Zamora-Zamorano, Deniz-Garcia, &#x00C1;lvarez-Mal&#x00E9;, &#x00C5;rsand, Soguero-Ruiz, W&#x00E4;gner, Granja, Callico and Fabelo</copyright-holder><license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><sec><title>Introduction</title>
<p>Diabetes mellitus (DM) is a chronic condition defined by increased blood glucose that affects more than 500 million adults. Type 1 diabetes (T1D) needs to be treated with insulin. Keeping glucose within the desired range is challenging. Despite the advances in the mHealth field, the appearance of the do-it-yourself (DIY) tools, and the progress in glucose level prediction based on deep learning (DL), these tools fail to engage the users in the long-term. This limits the benefits that they could have on the daily T1D self-management, specifically by providing an accurate prediction of their short-term glucose level.</p>
</sec><sec><title>Methods</title>
<p>This work proposed a DL-based DIY framework for interstitial glucose prediction using continuous glucose monitoring (CGM) data to generate one personalized DL model per user, without using data from other people. The DIY module reads the CGM raw data (as it would be uploaded by the potential users of this tool), and automatically prepares them to train and validate a DL model to perform glucose predictions up to one hour ahead. For training and validation, 1 year of CGM data collected from 29 subjects with T1D were used.</p>
</sec><sec><title>Results and Discussion</title>
<p>Results showed prediction performance comparable to the state-of-the-art, using only CGM data. To the best of our knowledge, this work is the first one in providing a DL-based DIY approach for fully personalized glucose prediction. Moreover, this framework is open source and has been deployed in Docker, enabling its standalone use, its integration on a smartphone application, or the experimentation with novel DL architectures.</p>
</sec>
</abstract>
<kwd-group>
<kwd>type 1 diabetes</kwd>
<kwd>deep learning</kwd>
<kwd>personalized medicine</kwd>
<kwd>continuous glucose monitoring</kwd>
<kwd>mHealth</kwd>
</kwd-group><contract-num rid="cn001">101017385</contract-num><contract-sponsor id="cn001">European Union&#x0027;s Horizon 2020</contract-sponsor><counts>
<fig-count count="7"/>
<table-count count="3"/><equation-count count="54"/><ref-count count="61"/><page-count count="22"/><word-count count="0"/></counts><custom-meta-wrap><custom-meta><meta-name>section-at-acceptance</meta-name><meta-value>Health Communications and Behavior Change</meta-value></custom-meta></custom-meta-wrap>
</article-meta>
</front>
<body><sec id="s1" sec-type="intro"><label>1</label><title>Introduction</title>
<p>Diabetes Mellitus (DM) is a chronic metabolic condition characterized by increased blood glucose level concentrations, which was suffered by around 537 million adults in 2021, representing nearly 10&#x0025; of the world population (<xref ref-type="bibr" rid="B1">1</xref>). Moreover, the number of people with diabetes will potentially grow to 643 million by 2030, with an estimation of over 6.7 million deaths from diabetes-related issues (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). Chronic hyperglycemia may lead to DM-associated complications, including damage to the heart, eyes, kidneys, blood vessels and nerves, seriously affecting the quality of life of those who suffer it (<xref ref-type="bibr" rid="B3">3</xref>). The two main types of DM are type 2 diabetes, caused by an increased resistance to insulin, where the body is not able to secrete enough insulin to overcome such resistance, and Type 1 Diabetes (T1D), which results from autoimmune, pancreatic beta-cell destructions that ends in a complete lack of insulin production (<xref ref-type="bibr" rid="B3">3</xref>, <xref ref-type="bibr" rid="B4">4</xref>).</p>
<p>Particularly, T1D is the main type of diabetes in childhood, although it can occur at any point in life. It accounts for 8.75 million people globally, 1.52 million of them being less than 20 years old by year 2021 (<xref ref-type="bibr" rid="B1">1</xref>). T1D treatment is a challenge, since imperfect, exogenous insulin administration aims to mimic (inexistent) endogenous insulin production, to keep glucose concentrations within a safe range, avoiding hyper- and hypoglycemia (high and low blood glucose levels, respectively). An individual with T1D experiences around two episodes of symptomatic hypoglycemia per week, which is directly associated with an increase in morbidity and mortality (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>). Due to the threat that these recurrent hypoglycemic events entail, T1D requires a lifetime of thorough self-management. To maintain the blood glucose levels in an appropriate range, people with T1D require daily administration of insulin, otherwise their lives would be seriously endangered. This control, together with regular consultations with an endocrinologist, are crucial to achieve good metabolic control, being able to live a healthy life and potentially mitigating the hardest long-term complications of T1D (<xref ref-type="bibr" rid="B3">3</xref>, <xref ref-type="bibr" rid="B7">7</xref>).</p>
<p>T1D self-management mainly includes glucose monitoring and subcutaneous insulin administration. Current glucose monitoring tools can be classified in two groups: capillary blood glucose measurements, which requires a puncture in a finger to extract a blood drop with a glucometer, and Continuous interstitial Glucose Monitoring (CGM), a technique that has become standard of care in many countries, and whose cost decrease and accuracy improvements will likely contribute to its expansion in the short-term (<xref ref-type="bibr" rid="B8">8</xref>). CGM devices use a sensor attached to the subject&#x0027;s skin that monitors interstitial glucose concentrations (typically every 5 or 15&#x2005;min, depending on the model of the sensor) (<xref ref-type="bibr" rid="B9">9</xref>). <xref ref-type="sec" rid="s11">Supplementary Figure S1a</xref> depicts a segment of a CGM signal. There is an international consensus to establish the guidance for assessment glycemic control taking the CGM as reference, although glucometers are still more accurate than CGM sensors. The target glucose range is 70&#x2013;180&#x2005;mg/dl, and the time spent within these values is called Time In Range (TIR). TIR is recommended to be greater than 70&#x0025; daily. The Time Above Range (TAR), i.e., with glucose concentrations over 180 mg/dl is advisable to be less than 25&#x0025;, whereas the Time Below Range (TBR), should not be more than 4&#x0025; of the day, corresponding to less than one hour (<xref ref-type="bibr" rid="B10">10</xref>). Therefore, the T1D individual&#x0027;s goal is to have the highest TIR possible, decreasing the TAR and TBR as much as possible. The visualization standard of these ranges in T1D dedicated mobile applications is illustrated in <xref ref-type="sec" rid="s11">Supplementary Figure S1b</xref>.</p>
<p>Current functionalities for the available commercialized CGM devices are the glucose data transfer to a display device (e.g., a smartphone), sometimes triggering alarms about the probable arise of hyper- or hypoglycemia episodes (<xref ref-type="bibr" rid="B9">9</xref>). CGM has proven to reduce the number of hypoglycemic events in people with T1D (<xref ref-type="bibr" rid="B11">11</xref>). Besides, continuous glucose sensors have also enabled the communication of the glucose readings to the insulin pumps, giving rise to the so-called hybrid closed loop systems, where basal and correction insulin infusions are automated, but the mealtime insulin is not, since there are no commercially available systems that provide meal information automatically (<xref ref-type="bibr" rid="B9">9</xref>).</p>
<p>Lately, mobile Health (mHealth) applications have been increasingly employed to enhance chronic conditions management, which is crucial to improve the individual&#x0027;s health outcomes (<xref ref-type="bibr" rid="B12">12</xref>). However, they have failed to address the challenge of individual&#x0027;s long-term non-adherence to the tools themselves, due mainly to data privacy concerns, lack of perceived usefulness, non-optimal usability and the potential costs associated to their use (<xref ref-type="bibr" rid="B13">13</xref>). Seeking engagement in mHealth applications, and to overcome the bureaucratic delays associated with regulatory processes, the <italic>Do-It-Yourself</italic> (DIY) approach has gained popularity recently (<xref ref-type="bibr" rid="B2">2</xref>). This approach facilitates the self-management of an individual&#x0027;s condition by easy access to their health data. In the diabetes field, the turning point arrived in 2014 with the <italic>Nightscout Project</italic>, the first reported DIY mHealth application for people with diabetes (<xref ref-type="bibr" rid="B14">14</xref>). In 2022, Morrison et al. published a review of DIY systems used in people with T1D, evidencing that people are willing to use this kind of systems rather than the commercial ones (<xref ref-type="bibr" rid="B15">15</xref>). Additionally, in this approach the individuals are the digital tool providers, instead of medical companies, thus enabling an easy-to-use and subject-driven approach (<xref ref-type="bibr" rid="B16">16</xref>), which is strongly related with the tool engagement and usability (<xref ref-type="bibr" rid="B17">17</xref>). Furthermore, DIY systems have demonstrated to be effective in the glycemic control in people with diabetes (<xref ref-type="bibr" rid="B18">18</xref>). Although in the diabetes context DIY refers to people with this condition developing the tool by themselves, in this work this term refers to their indirect participation through the co-creation process of this module, the fact that this open source module allows individuals to generate their own personalized models using their data, together with the fact that researchers and/or software developers could implement further improvements on it, and implement it as an smartphone application.</p>
<p>Summarizing, despite the outlined advances in glucose monitoring, most people with T1D do not reach optimal glycemic control (<xref ref-type="bibr" rid="B19">19</xref>). Although there are diverse reasons that explain this, the most relevant factors that could be mitigated by the implementation of a personalized AI-based tool are:
<list list-type="simple">
<list-item><label>a.</label>
<p>The high intra-subject variability in CGM measurements in people with T1D, the errors in glucose measurements and the delay in the control actions (<xref ref-type="bibr" rid="B20">20</xref>).</p></list-item>
<list-item><label>b.</label>
<p>The suboptimal usability of the current available digital tools for T1D management, that ends on the disregard of many individuals for them (<xref ref-type="bibr" rid="B17">17</xref>).</p></list-item>
<list-item><label>c.</label>
<p>The lack of personalization in the available digital tools that could provide accurate and customized feedback, considering individual metabolism, environment, or digital alphabetization (<xref ref-type="bibr" rid="B2">2</xref>).</p></list-item>
</list>An accurate and reliable prediction of the glucose concentration in the next minutes or hours would certainly support individuals, anticipating possible hyper- and hypoglycemic events. This knowledge is already included in the hybrid close-loop systems to improve the insulin delivery (<xref ref-type="bibr" rid="B21">21</xref>). There are numerous studies that have assessed this task using mainly three approaches. Physiological models use equations to describe human metabolism; data-driven models, where this work is enclosed, are based on time series analysis and Machine/Deep learning (ML/DL) techniques; and hybrid models are a combination of the above (<xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B23">23</xref>). The data-driven models are the ones that have presented the best prediction performance so far (<xref ref-type="bibr" rid="B22">22</xref>). Most of the studies, including those with the most accurate predictions, are based on Convolutional Neural Networks (CNNs) (<xref ref-type="bibr" rid="B24">24</xref>, <xref ref-type="bibr" rid="B25">25</xref>) and Long Short-Term Memory (LSTM) architectures (<xref ref-type="bibr" rid="B26">26</xref>). However, although the advances in this field are promising, most of the published literature lacks a subject-oriented approach in the Artificial Intelligence (AI) implementation and evaluation, limiting the impact that these algorithms can have on people&#x0027;s lives.</p>
<p>Currently, there is a scenario where the arrival of DIY tools embraced by people with T1D, the promising advances of AI in glucose forecasting, and the progress in the mHealth field do not fully converge, thus limiting the implementation of such systems in the healthcare programs (<xref ref-type="bibr" rid="B27">27</xref>). Additionally, data privacy has become one of the main concerns of the users when using personal and clinical data in mobile applications (<xref ref-type="bibr" rid="B28">28</xref>), which is related to the reservations of using them daily (<xref ref-type="bibr" rid="B29">29</xref>). Thus, the proposed AI-based DIY framework (<xref ref-type="fig" rid="F1">Figure&#x00A0;1</xref>) intends to merge these advances and overcome these limitations, contributing in terms of AI model personalization and data privacy to enhance T1D self-management including the following features:
<list list-type="simple">
<list-item><label>a.</label>
<p>Robust validation approach of fully personalized AI-based models (using only the user&#x0027;s own data) to make 30- and 60-min interstitial glucose forecasting, based on the state-of-the-art architectures using 1 year of CGM data.</p></list-item>
<list-item><label>b.</label>
<p>Integration of the DL workflow in a DIY module for software developers that includes personalization in the way T1D data is shown to the user.</p></list-item>
<list-item><label>c.</label>
<p>AI-related information, targeting user empowerment in the use of AI, informing them about the relationship between their data and the AI models generated (e.g., why a DL model cannot be reliably trained with the provided data) (<xref ref-type="bibr" rid="B30">30</xref>).</p></list-item>
<list-item><label>d.</label>
<p>Secure design that enables the local generation and execution of the DL model in the user&#x0027;s own device, avoiding sharing personal data with third parties.</p></list-item>
<list-item><label>e.</label>
<p>Open-source modular design that allows researchers and developers the integration of data from new sensors, preprocessing stages, or additional DL architectures in a straightforward way.</p></list-item>
</list></p>
<fig id="F1" position="float"><label>Figure 1</label>
<caption><p>Proposed AI-based DIY framework for interstitial glucose level prediction up to 30 and 60&#x2005;min in people with T1D. Framework steps are illustrated in order. The zone delimited by dashed lines is only executed once: in the user&#x0027;s first use. Out of this zone, the steps that the user will perform every time he/she uses the DIY module are illustrated. For the analysis presented in this work, this framework has been executed once per included subject (<italic>n</italic>&#x2009;&#x003D;&#x2009;29). After the first use, the module is designed to, every time the user &#x201C;triggers&#x201D; it, automatically read the last day of the available CGM data and provide an immediate 30- or 60-min prediction. Currently, if there are CGM readings interruptions, a prediction is not provided. <bold>(a)</bold> In the first use, the users upload the raw CGM data to generate the DL model as data were downloaded by the corresponding application. In subsequent uses, user allows the Reading of the last day of data to perform a prediction. <bold>(b)</bold> Automatic data analysis and preparation is performed to check if the provided data allows a reliable AI model generation or not. If so, data is prepared to train and validate the model. <bold>(c)</bold> Min-max normalization and 4-fold trimester-wise data partition. <bold>(d)</bold> AI model generation after fold shuffling, train, validation, model evaluation, and best model selection. <bold>(e)</bold> Illustration of subsequent module uses, including interstitial glucose prediction and data visualization.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-07-1534830-g001.tif"/>
</fig>
<p>To the best of our knowledge, this work proposes the first personalized AI-based DIY module for both software developers and people with T1D to aid the latter with their daily self-management by providing up to one-hour interstitial glucose level forecasting. The design of this module allows its easy integration on a smartphone, even if it only has been tested on a computer. For the sake of usability improvement and user engagement, this tool has been designed considering the daily habits of people with T1D regarding their glycemic control, and the challenges they usually face through a co-creation process. Besides, this has been achieved following a robust methodology to train and technically validate the DL models, using 1 year of CGM data, and a global and subject-wise evaluation. This module automatically analyses the individual&#x0027;s data, trains, and validates a fully personalized DL model once the user has uploaded her/his CGM data. As a result, the user obtains a detailed visualization of their data in a standardized but customizable manner, as well as a forecast of her/his interstitial glucose level. If a hypo- or hyperglycemic episode is predicted, a warning message will be triggered.</p>
</sec>
<sec id="s2"><label>2</label><title>Materials and methods</title>
<sec id="s2a"><label>2.1</label><title>T1D dataset</title>
<p>CGM data were collected at the <italic>Complejo Hospitalario Insular-Materno Infantil de Las Palmas de Gran Canaria</italic> from 41 people with T1D that use a sensor from the FreeStyle Libre (Abbott) family. Additional data, such as physical activity, insulin administration, or carbohydrates, were not available for any of the subjects involved in this study. The raw data were extracted from the LibreView<sup>TM</sup> (Abbott) website by an endocrinologist in raw Comma-Separated Values (CSV) format. Participants were invited to participate and were given oral and written information. All participants signed a written informed consent form. Individual&#x0027;s data were stored on a secure server only accessible through a virtual private network by people working on the WARIFA project (<xref ref-type="bibr" rid="B31">31</xref>) after being given individual access credentials.</p>
<p><xref ref-type="sec" rid="s11">Supplementary Table S2</xref> summarizes each subject&#x0027;s more relevant information regarding AI processing associated with an anonymous ID. To train DL models, a sufficient number of samples for each subject is needed. Among the 41 subjects there were cases in which this requirement was not fulfilled, due to sensor malfunction or due to multiple sensor replacements in a short period of time. Moreover, different sampling periods in the sensors could imply variations in the considered architectures. Thus, only the subjects that met the following inclusion criteria were considered in this study:
<list list-type="simple">
<list-item><label>1.</label>
<p>To have at least 1 year of CGM readings with the same sensor. Sensor malfunction (e.g., reading interruptions) was considered and further treated to conform the instances to train and validate the DL models.</p></list-item>
<list-item><label>2.</label>
<p>To have a glucose sensor with a sampling period of 15&#x2005;min, aiming a fair prediction performance comparison between different subjects.</p></list-item>
</list>Finally, 29 subjects met the inclusion criteria, for whom it was used the oldest year (when more available) of these subjects to train and validate the personalized AI-models. The oldest year was selected so subsequent CGM readings were left for potential further testing of the DL models. Besides, when available, additional data were collected for a final model test.</p>
</sec>
<sec id="s2b"><label>2.2</label><title>CGM data preparation and preprocessing</title>
<p>The data curation phase was performed by filtering out the subjects that did not meet the inclusion criteria previously described. The framework was executed one time per included subject (i.e., 29 times) using the first recorded year of each subject. At this point, there was a unique sequence of CGM readings for each subject with their associated timestamps to which a pre-processing step was applied. At that point, data were still not suitable for the training of the DL models.</p>
<p>Then, an automatic and parametric subject-per-subject sequence-to-sequence (from now, <italic>seq-to-seq</italic>) (i.e., an input sequence and an output sequence) dataset generation was developed (<xref ref-type="fig" rid="F1">Figure&#x00A0;1B</xref>). The considered parameters were the <italic>window length</italic>, denoted as <italic>N</italic> (96 in this work), the <italic>step</italic> from one sequence to the next one (set to one in this case), and <italic>prediction steps</italic>, which is the result of the division between the Prediction Horizon (PH), i.e., how far ahead the model predicts, and the sensor sampling period. For this case, this parameter was set to four and two (60- and 30-min PH/15&#x2005;min sampling period, respectively). Notice that, with this approach, there is a trade-off between the window input length and number of training instances; a larger input length will likely provide more information to the DL model, but fewer training instances will be generated, potentially limiting the prediction performance.</p>
<p>Firstly, the time intervals between two consecutive readings were computed considering the sensor timestamps associated with all readings. Although the nominal sampling period of all the sensors included in this work is 15&#x2005;min, the actual interval between consecutive samples may vary from this reference value (<xref ref-type="sec" rid="s11">Supplementary Figure S10</xref>). Therefore, to be compliant with the assumption of data provided in periodic time slots, two samples are actually consecutive when the time between them is lower than twice the sampling period (i.e., 30&#x2005;min). As depicted in <xref ref-type="sec" rid="s11">Supplementary Figure S6</xref>, it is assumed that, if the sensor reading is delayed or advanced in 2&#x2009;&#x00D7;&#x2009;sampling period minus 1&#x2005;s (i.e., 29:59&#x2005;min), that reading corresponds to the next timeslot.</p>
<p>Every time that two consecutive samples in the CGM sequence surpassed 29:59&#x2005;min, a new data block was created. Therefore, the number of blocks depends on the number and location of interruptions in the data (<xref ref-type="fig" rid="F1">Figure&#x00A0;1B</xref>). Furthermore, the minimum number of consecutive samples to form a usable block (i.e., to form an instance suitable to train the DL models) is equal to the length of the input sequence plus the length of the output sequence. Otherwise, those samples are discarded and will not be used to generate and train the AI models. Notice that the ideal case would be to have only one data block without interruptions. After the data block generation, each data block is swept into steps of one to generate the model inputs (<italic>X</italic>) and the associated outputs (<italic>Y</italic>). Thus, block length determines the number of instances a particular block provides. After the sequences were generated from all data blocks, they are concatenated as instances to perform the min-max normalization as described in <xref ref-type="disp-formula" rid="disp-formula1">Equation&#x00A0;1</xref>.<disp-formula id="disp-formula1"><label>(1)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM1"><mml:msub><mml:mi>i</mml:mi><mml:mrow><mml:mi>n</mml:mi><mml:mi>o</mml:mi><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mrow><mml:mi>i</mml:mi><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mi>S</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mi>S</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mi>a</mml:mi><mml:mi>x</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mspace width="thickmathspace" /><mml:msub><mml:mi>S</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac></mml:mrow><mml:mo>,</mml:mo></mml:mstyle></mml:math></disp-formula>where <italic>i</italic> represents a given sample <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM1"><mml:msub><mml:mi>i</mml:mi><mml:mrow><mml:mi>n</mml:mi><mml:mi>o</mml:mi><mml:mi>r</mml:mi><mml:mi>m</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> is the normalized sample, and <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM2"><mml:msub><mml:mi>S</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mi>a</mml:mi><mml:mi>x</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> and <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM3"><mml:msub><mml:mi>S</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> the global maximum and minimum values of a subject&#x0027;s data.</p>
<p>Additionally, there were a few cases where the CSV file did not follow LibreView&#x0027;s standard way of presenting the data. In such cases, glucose concentration values were considered corrupted, and thus treated as interruptions.</p>
</sec>
<sec id="s2c"><label>2.3</label><title>ISO adapted loss function</title>
<p>ISO 15197:2015 (<xref ref-type="bibr" rid="B32">32</xref>) establishes two specific criteria for glucose concentration monitoring systems, both based on the discrepancy between measured values and their reference counterparts. Although this standard was developed for glucose sensor measurement errors, its criteria can be extrapolated to evaluate errors between the actual glucose concentration and a value predicted by a model, tailoring the prediction problem assessment to the glucose monitoring context. AI-based models, such as those proposed in this work, are often trained with the aim of minimizing standard loss functions based on squared or absolute errors. Although theoretically both approaches lead to the same optimal solution, in practice a better result is expected if the loss functions are adapted to the required validation performance. A customized loss function has therefore been designed to enforce compliance with the criteria specified in the ISO standard.</p>
<p>Firstly, the two validation criteria, i.e., the one referring to the acceptable error zone in terms of accuracy and the one attending to regions A and B in the Consensus Error Grid [CEG&#x2014;also called Parkes Error Grid (PEG)] (<xref ref-type="bibr" rid="B24">24</xref>, <xref ref-type="bibr" rid="B26">26</xref>), have been analyzed by comparing the maximum admissible error values for each case. As shown in <xref ref-type="sec" rid="s11">Supplementary Figure S7</xref>, the former criterion is the most restrictive except in the narrow range of reference values from 164 to 174&#x2005;mg/dl, where the maximum admissible error is established by the boundary of region A in the CEG. Hence, it could be assumed that error values of 15&#x2005;mg/dl or 15&#x0025; of the reference value, depending on whether the actual concentration is less than 100&#x2005;mg/dl or not, respectively, define the upper bound of the admissible error.</p>
<p>The strategy for designing an error function explicitly considering this upper bound is to force a barrier in the form of a steep slope of the function in the neighborhood of the threshold value. This can be achieved by introducing an additive term to the quadratic error that can be considered negligible (ideally zero) in the admissible region but large (ideally infinite) elsewhere. Nevertheless, the desirable properties of the error function must be preserved to facilitate the optimization process of AI model training, specifically its increasing monotonicity with the magnitude of the error and its smoothness. It is inspired by the design of low-pass filters, where the constraints are similar, with a low attenuation in the admissible region and a cut-off value beyond which the attenuation is high. Therefore, the additive term <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM4"><mml:mi>&#x03B3;</mml:mi></mml:math></inline-formula> shown in the following <xref ref-type="disp-formula" rid="disp-formula2">Equation&#x00A0;2</xref> is proposed:<disp-formula id="disp-formula2"><label>(2)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM2"><mml:mi>&#x03B3;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>&#x03F5;</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mi>K</mml:mi><mml:msup><mml:mi>&#x03F5;</mml:mi><mml:mrow><mml:mn>2</mml:mn><mml:mi>n</mml:mi></mml:mrow></mml:msup></mml:math></disp-formula>where the variable <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM5"><mml:mi>&#x03F5;</mml:mi></mml:math></inline-formula> refers to the normalised error in the prediction of a sample, i.e., the error itself if less than 100&#x2005;mg/dl or the error multiplied by <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM6"><mml:mspace width="thickmathspace" /><mml:mrow><mml:mfrac><mml:mrow><mml:mn>100</mml:mn></mml:mrow><mml:mi>r</mml:mi></mml:mfrac></mml:mrow></mml:math></inline-formula>, being <italic>r</italic> the reference value associated with that sample, and <italic>K</italic> is the proper constant to conform the transition in a way that the term remains below a prescribed tolerance in the admissible region and surpasses an established threshold for large error values.</p>
<p>The overall expression for the error function (<inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM7"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>), including the quadratic error and the additive term <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM8"><mml:mi>&#x03B3;</mml:mi></mml:math></inline-formula> is detailed in <xref ref-type="disp-formula" rid="disp-formula3">Equation&#x00A0;3</xref>.<disp-formula id="disp-formula3"><label>(3)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM3"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>&#x03F5;</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mspace width="thickmathspace" /><mml:msup><mml:mi>&#x03F5;</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mi>&#x03B3;</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mi>&#x03F5;</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mspace width="thickmathspace" /><mml:msup><mml:mi>&#x03F5;</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mi>K</mml:mi><mml:mspace width="thickmathspace" /><mml:msup><mml:mi>&#x03F5;</mml:mi><mml:mrow><mml:mn>2</mml:mn><mml:mi>n</mml:mi></mml:mrow></mml:msup></mml:math></disp-formula><xref ref-type="fig" rid="F2">Figure&#x00A0;2</xref> highlights the different behavior of <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM9"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> with respect to the squared error around the 15&#x2005;mg/dl limit prescribed in ISO 15197:2015. Its steeper slope enhances the reduction of the error for non-compliant samples compared to those already within the acceptable range.</p>
<fig id="F2" position="float"><label>Figure 2</label>
<caption><p>Basis of the development of the <italic>L</italic><sub>ISO</sub> loss function design. <bold>(a)</bold> Conventional squared error vs ISO 15197:2015 customized squared error in linear scale. <bold>(b)</bold> Conventional squared error vs ISO 15197: 2015 customized squared error in logarithmic scale. Error losses are plotted as functions of the Blood Glucose (BG) difference, i.e., the deviation of the test (predicted) glucose concentration from the reference (ground truth) value, expressed in mg/dl or percentage of the reference value according to the ISO standard. Similar behavior of both error functions is observed in the admissible range, delimited by red dashed lines.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-07-1534830-g002.tif"/>
</fig>
<p>This function should be considered as a modified version of the quadratic error of a sample and therefore allows composing loss functions for collections of samples by addition or averaging as well as the use of its square root to work in the same units in which the error is defined (mg/dl in the case of interstitial glucose concentration prediction). In this work, <italic>n</italic> has been set to 40, and <italic>K</italic> set to 0.1/14<sup>80</sup>.</p>
</sec>
<sec id="s2d"><label>2.4</label><title>Proposed AI-based framework</title>
<p><xref ref-type="fig" rid="F1">Figure&#x00A0;1</xref> shows the proposed framework to develop a personalized AI-based DIY module for interstitial glucose forecasting for people with T1D. It has been developed in Python 3.10.13 (<xref ref-type="bibr" rid="B33">33</xref>), using TensorFlow 2.10.0 (<xref ref-type="bibr" rid="B34">34</xref>) for the development of the DL models. This work was developed using an AMD Ryzen 5 3600 6-core processor and an NVIDIA GeForce RTX 4070 Ti GPU to speed up the training process of the large number of models that were generated. The choice of this approach was based on the following ideas:
<list list-type="simple">
<list-item><label>a.</label>
<p>the robustness of the DL models in the training and validation phase, considering different groups of three months within a year to train and validate the models.</p></list-item>
<list-item><label>b.</label>
<p>the adaptation of the forecasting problem to the CGM case [e.g., adapting the loss function used to train the DL models based on the ISO 15197:2015 (<xref ref-type="bibr" rid="B32">32</xref>)].</p></list-item>
<list-item><label>c.</label>
<p>the development of a fully personalized AI-based DIY module to predict interstitial glucose, preserving individuals&#x0027; privacy and considering the daily habits of self-management of T1D.</p></list-item>
<list-item><label>d.</label>
<p>the enhancement of the usability of this AI-based module (<xref ref-type="bibr" rid="B17">17</xref>) to either easily integrate it in a broader application environment and workflow or use it as a standalone tool.</p></list-item>
</list>Normally, each glucose sensor can be read with a dedicated reader or an application in the user&#x0027;s mobile phone, provided by the manufacturer. If interested, users can also have access to their raw data, which they can download. In a DIY approach, it is assumed that the users will download and deal with their data. Hence, this framework automatically reads the raw CSV data provided by the endocrinologist (in the final application would be the user itself who would upload his/her data) and prepares them to be further processed without the need for more interaction by the user.</p>
</sec>
<sec id="s2e"><label>2.5</label><title>Deep learning architectures</title>
<p>For the interstitial glucose forecasting, a <italic>seq-to-seq</italic> approach (<xref ref-type="bibr" rid="B35">35</xref>) was proposed due to its proven effectiveness in time series forecasting (<xref ref-type="bibr" rid="B36">36</xref>). In the <italic>seq-to-seq</italic> approach, the input of the model is one sequence (or more) of a certain length, and the model outputs a sequence of a certain length (usually shorter than the input for time series forecasting) that represents the subsequent time instants in the nearest future.</p>
<p>As a first approximation, the input sequence length was set as to 96 samples [i.e., 24&#x2005;h at a sampling period of 15&#x2005;min, which corresponds to an average period that includes basal glucose regulation mechanisms (<xref ref-type="bibr" rid="B37">37</xref>)]. This was established considering that all CGM sensors included in this study had a sampling period of 15&#x2005;min, based on clinical knowledge, subject&#x0027;s autocorrelation studies, and considering the trade-off between the input length and the number of generated training instances. As a second input, the first difference of the CGM input window was computed to feed the DL models with additional information about CGM variations. Besides, two different PHs, have been assessed: 30- and 60-min PHs. Having a sampling period of 15&#x2005;min implies an output sequence of two and four samples, respectively.</p>
<p>The proposed DL models were based on CNNs (<xref ref-type="bibr" rid="B38">38</xref>), and LSTMs (<xref ref-type="bibr" rid="B39">39</xref>), due to their promising results reported in time series forecasting, and specifically, in glucose levels forecasting (<xref ref-type="bibr" rid="B24">24</xref>&#x2013;<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B40">40</xref>). Three different DL models, together with a baseline model, have been evaluated in this work:
<list list-type="simple">
<list-item><label>1.</label>
<p><italic>Na&#x00EF;ve</italic>: For the sake of comparison, a na&#x00EF;ve forecasting (<xref ref-type="bibr" rid="B24">24</xref>) approach was included in the study. It consists of making the prediction by outputting the last values of the input sequence. This elementary prediction is considered the baseline to compare the performance of the proposed DL-based models.</p></list-item>
<list-item><label>2.</label>
<p><italic>LSTM</italic>: A single LSTM cell with <italic>N</italic> memory units, <italic>N</italic> being the input sequence length (set to 96 samples), followed by a fully connected layer, whose output dimension is equal to the number of predicted points.</p></list-item>
<list-item><label>3.</label>
<p><italic>Stacked-LSTM</italic>: A Stacked-LSTM (i.e., a model that comprises several LSTM cells) (<xref ref-type="bibr" rid="B36">36</xref>) composed by five layers in an encoder scheme of <italic>N, N/2, N/2,N/4</italic> and <italic>N/4</italic> memory units, from the outer to the inner layer respectively. The intention underlying this architecture is to learn the longer-term features in the layers closer to the input, and the more local temporal dependencies at the layers closer to the output. A drop-out (<xref ref-type="bibr" rid="B41">41</xref>) of 0.05 was added to contemplate the randomness of the studied phenomena and to avoid overfitting on the training set (<xref ref-type="bibr" rid="B42">42</xref>). The LSTM cells are followed by a fully connected layer whose output size is equal to the number of predicted points.</p></list-item>
<list-item><label>4.</label>
<p><italic>Dil-UNet</italic>: Inspired by the promising results of the U-Net one-dimensional heart sound segmentation (<xref ref-type="bibr" rid="B43">43</xref>), and in the successful use of CNN with dilated convolutions (<xref ref-type="bibr" rid="B25">25</xref>), a regression model based on a dilated U-Net has been proposed. It consists of a four-stage encoding-decoding network, with the hyperparameters outlined in <xref ref-type="sec" rid="s11">Supplementary Table S1</xref>. The number of filters of the first layer was set to 4 times the number of input features. They were doubled in each encoding stage of the network and halved in its decoding part. Besides, after the last encoding convolutional layer, there are two intermediate layers that double its number of filters. There are skip connections between each encoding-decoding peer to enable direct transfer of information. The dilation rate of the convolution was added to augment the receptive field of the operations and was set to one. As with the Stacked-LSTM, several drop-out layers were added, increasing the rate to 0.1 due to the greater number of weights of this model. The last convolutional layer was connected to a fully connected layer whose output dimension is equal to the number of predicted points.</p></list-item>
</list><xref ref-type="sec" rid="s11">Supplementary Table S1</xref> shows the model and training hyperparameters chosen for each architecture, which have been heuristically chosen after several trial-and-error experiments with subjects that were considered to represent the best, worst, and average subjects in terms of prediction performance. It also shows the number of parameters of each model. Notice that, due to the variation of the dense layer size that outputs the prediction sequence in the different PHs, there is a slight variation in this number for each PH. Due to the time constraints associated with the large number of independent models (one for each subject) generated in this study, hyperparameter optimization was not feasible. Notice that the training hyperparameters were the same for all architectures, seeking a fair prediction performance comparison. The batch size was set to one to compensate for the low number of samples of some of the included subjects.</p>
<p>Adam optimizer was used to train the models, using the standard Mean Squared Error (MSE) as the loss function, as well as using the novel <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM10"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> loss previously described. Due to the extensive computational time associated with the large number of generated models in this experiment, early stopping was implemented after two epochs without reducing the loss function. The delta, (i.e., the minimum change required in the loss function value to consider a model improvement) was set to 0.0001 for both loss functions aiming at a fair comparative. This delta was considered the optimum after heuristic experimentation. In the same way, it was noticed that the models performed better when not only the CGM was considered as input, but also the CGM&#x0027;s first difference. Experiments also showed that introducing the second difference worsened the prediction performance. Hence, the DL models had two input features: the CGM and its first difference.</p>
<p>Finally, considering that hypoglycemic events are a severe health threat, the output sequences that contained samples in the hypoglycemic range were weighted the most to train the DL models, followed by the output sequences containing samples in the hyperglycemic range. Sequences that were within the target CGM range were not weighted beyond considering its occurrence including its probability in the equation. Besides, the occurrence of hypoglycemic samples is lower than the hyper- and normal CGM ranges. This together with the fact that such occurrence varies among subjects, the abovementioned weighted factor was multiplied by the probability of a given sample to be in range, or in the hyper- and hypo- ranges. This introduces the models&#x0027; personalization from the training process. Depending on the number of samples in the different ranges, the weighting varies. Generally, the samples to train the models were weighted as described in <xref ref-type="disp-formula" rid="disp-formula4">Equations&#x00A0;4</xref>&#x2013;<xref ref-type="disp-formula" rid="disp-formula6">6</xref> for output sequences that contained hypo-, hyperglycemic samples, and samples that were in the target range, respectively. The weights multiplying the inverse of the probability of occurrence were obtained heuristically.<disp-formula id="disp-formula4"><label>(4)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM4"><mml:msub><mml:mi>W</mml:mi><mml:mrow><mml:mi>h</mml:mi><mml:mi>y</mml:mi><mml:mi>p</mml:mi><mml:mi>o</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>2</mml:mn><mml:mspace width="thickmathspace" /><mml:mi>x</mml:mi><mml:mspace width="thickmathspace" /><mml:mn>1</mml:mn><mml:mrow><mml:mo>/</mml:mo></mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>h</mml:mi><mml:mi>y</mml:mi><mml:mi>p</mml:mi><mml:mi>o</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:math></disp-formula><disp-formula id="disp-formula5"><label>(5)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM5"><mml:msub><mml:mi>W</mml:mi><mml:mrow><mml:mi>h</mml:mi><mml:mi>y</mml:mi><mml:mi>p</mml:mi><mml:mi>e</mml:mi><mml:mi>r</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>1.1</mml:mn><mml:mspace width="thickmathspace" /><mml:mi>x</mml:mi><mml:mspace width="thickmathspace" /><mml:mn>1</mml:mn><mml:mrow><mml:mo>/</mml:mo></mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>h</mml:mi><mml:mi>y</mml:mi><mml:mi>p</mml:mi><mml:mi>e</mml:mi><mml:mi>r</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:math></disp-formula><disp-formula id="disp-formula6"><label>(6)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM6"><mml:msub><mml:mi>W</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mspace width="thickmathspace" /><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mi>g</mml:mi><mml:mi>e</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mrow><mml:mo>/</mml:mo></mml:mrow><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mspace width="thickmathspace" /><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mi>g</mml:mi><mml:mi>e</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:math></disp-formula>Where <italic>W</italic> represents the weights for a given subject&#x0027;s hypoglycemic (<inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM11"><mml:msub><mml:mi>W</mml:mi><mml:mrow><mml:mi>h</mml:mi><mml:mi>y</mml:mi><mml:mi>p</mml:mi><mml:mi>o</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>), hyperglycaemic <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM12"><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>W</mml:mi><mml:mrow><mml:mi>h</mml:mi><mml:mi>y</mml:mi><mml:mi>p</mml:mi><mml:mi>e</mml:mi><mml:mi>r</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>) and in-range (<inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM13"><mml:msub><mml:mi>W</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mspace width="thickmathspace" /><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mi>g</mml:mi><mml:mi>e</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>) sample, and <italic>p</italic> refers to the probabilities of a given sample to belong to the hypoglycemic range <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM14"><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>h</mml:mi><mml:mi>y</mml:mi><mml:mi>p</mml:mi><mml:mi>o</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:math></inline-formula>, hyperglycaemic range <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM15"><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>h</mml:mi><mml:mi>y</mml:mi><mml:mi>p</mml:mi><mml:mi>e</mml:mi><mml:mi>r</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:math></inline-formula>, and an in-range sample <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM16"><mml:mi>p</mml:mi><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mspace width="thickmathspace" /><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>n</mml:mi><mml:mi>g</mml:mi><mml:mi>e</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:math></inline-formula>. Notice that, for each subject, the probability is computed as the number of samples in each range divided by the total number of samples.</p>
</sec>
<sec id="s2f"><label>2.6</label><title>Trimester-wise 4-fold cross-validation</title>
<p>From the set of sequences collected, the data partition was conducted as depicted in <xref ref-type="fig" rid="F1">Figure&#x00A0;1C</xref>. To analyze if the performance of the different AI models depends on the period of the year used to train them, which can be related to sensor misfunction, holidays period, etc., the models were cross-validated using a 4-fold approach, where each fold contained data from a consecutive 3-month period. Hence, a 9-month period and a 3-month period were used for training and validation, respectively, for each fold. For every subject, the oldest timestamp marked the beginning of the first fold. The second, third, and fourth folds were generated adding 3, 6, and 9 months to the first timestamp, respectively. Notice that there were some instances that contained data from different days, and subsequently, from different months. For the sake of consistency, borderline instances that contained data from different folds were discarded for cross-validation. Furthermore, due to the heterogeneity in the sensor reading interruptions, there were folds with more instances than others. This could have an impact on the final regression performance of the models between folds from the same subject. Finally, every fold was shuffled before feeding the DL models.</p>
<p>Notice that every architecture was trained and validated with the standard MSE and the <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM17"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> loss functions, and this was performed for the 4 folds. Moreover, the same methodology was applied for two PHs: 30 and 60&#x2005;min. Hence, and taking into account that the na&#x00EF;ve approach does not need to be trained, for each subject, 48 AI models (3 architectures&#x2009;&#x00D7;&#x2009;2 loss functions&#x2009;&#x00D7;&#x2009;4 folds&#x2009;&#x00D7;&#x2009;2 PHs) were generated. Considering the 29 subjects, 1,392 personalized AI-based interstitial glucose forecasting models were generated and evaluated in this work. This large number of models strongly limited the number of experiments that could be performed following this approach.</p>
</sec>
<sec id="s2g"><label>2.7</label><title>Prediction evaluation metrics</title>
<p>Commonly, prediction models for interstitial glucose level forecasting are evaluated using classical regression evaluation metrics, such as Root Mean Squared Error (RMSE), Mean Absolute Error (MAE) or Mean Absolute Percentage Error (MAPE), described in <xref ref-type="disp-formula" rid="disp-formula7">Equations&#x00A0;7</xref>&#x2013;<xref ref-type="disp-formula" rid="disp-formula9">9</xref>, respectively, where <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM18"><mml:msub><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x005E;</mml:mo></mml:mover></mml:mrow><mml:mi>i</mml:mi></mml:msub></mml:math></inline-formula> is the forecasted value, <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM19"><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:math></inline-formula> the corresponding ground truth, and <italic>N</italic> the number of considered values. In this work, they have been also used. However, only a few studies in the literature report the results achieved using the CEG and, to the best of our knowledge, none of them uses the complete ISO 15197:2015 (<xref ref-type="bibr" rid="B32">32</xref>) criteria for such evaluation since it is a highly restricted evaluation metric.</p>
<p>ISO 15197 is an international standard on <italic>in vitro</italic> diagnostic test that addresses self-testing blood glucose monitoring systems for managing diabetes mellitus within the realm of <italic>in vitro</italic> diagnostic test systems. These systems are designed for self-measurement by individuals without specialized medical training for the purpose of managing their condition. This standard, which has been adapted from the sensor accuracy measurement to the error between the prediction and the actual value in this work, as mentioned before in the text, establishes that the blood glucose monitoring systems (in this work, extrapolated to prediction error), must meet these two criteria:
<list list-type="simple">
<list-item><label>&#x2022;</label>
<p>95&#x0025; of the measured (predicted) glucose values must be within &#x00B1;15&#x2005;mg/dl for blood glucose concentrations below 100&#x2005;mg/dl. For values equal or greater than 100&#x2005;mg/dl, the margin of error is percentage and is set at &#x00B1;15&#x0025;. This is illustrated in <xref ref-type="sec" rid="s11">Supplementary Figure S8a</xref>.</p></list-item>
<list-item><label>&#x2022;</label>
<p>99&#x0025; of the measured (predicted) glucose values should fall within zones A and B of the CEG for T1D. As shown in <xref ref-type="sec" rid="s11">Supplementary Figure S8b</xref>, the CEG is divided into 5 zones according to the estimated risk to the people with T1D if an outcome fails, starting with zone A, where there is no effect on clinical action, to zone E, where clinical action is altered with dangerous consequences.</p></list-item>
</list>Unlike the classic regression metrics, these have clinical meaning and penalize more the errors in clinically critical intervals (i.e., errors that imply misprediction of hypo- or hyperglycemia events), so they have been taken as a reference instead of the RMSE, as has been usually done (<xref ref-type="bibr" rid="B24">24</xref>&#x2013;<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B44">44</xref>, <xref ref-type="bibr" rid="B45">45</xref>). Hence, in this work, two additional metrics that considered these two criteria were studied: the percentage of the total predicted points within the Parkes acceptable zone (<italic>ParkesAB</italic>), and within the ISO acceptable zone (<italic>ISOZone</italic>).<disp-formula id="disp-formula7"><label>(7)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM7"><mml:mi>R</mml:mi><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:msqrt><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>N</mml:mi></mml:mfrac></mml:mrow><mml:munderover><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:mo>&#x2061;</mml:mo><mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x005E;</mml:mo></mml:mover></mml:mrow></mml:mrow><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mspace width="thickmathspace" /><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mstyle></mml:msqrt></mml:math></disp-formula><disp-formula id="disp-formula8"><label>(8)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM8"><mml:mi>M</mml:mi><mml:mi>A</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:mspace width="thickmathspace" /><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>N</mml:mi></mml:mfrac></mml:mrow><mml:munderover><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:mo>&#x2061;</mml:mo><mml:mo fence="false" stretchy="false">|</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x005E;</mml:mo></mml:mover></mml:mrow></mml:mrow><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mspace width="thickmathspace" /><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow><mml:mo fence="false" stretchy="false">|</mml:mo><mml:mspace width="thickmathspace" /></mml:mstyle></mml:math></disp-formula><disp-formula id="disp-formula9"><label>(9)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM9"><mml:mi>M</mml:mi><mml:mi>A</mml:mi><mml:mi>P</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:mspace width="thickmathspace" /><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>N</mml:mi></mml:mfrac></mml:mrow><mml:munderover><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mrow><mml:mo fence="false" stretchy="false">|</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x005E;</mml:mo></mml:mover></mml:mrow></mml:mrow><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mspace width="thickmathspace" /><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow><mml:mo fence="false" stretchy="false">|</mml:mo></mml:mrow><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mrow><mml:mo>&#x2217;</mml:mo><mml:mn>100</mml:mn><mml:mspace width="thickmathspace" /><mml:mtext>&#x0025;</mml:mtext></mml:mstyle></mml:mstyle></mml:math></disp-formula></p>
</sec>
<sec id="s2h"><label>2.8</label><title>Do-it-yourself module design and containerization</title>
<p>After performing the personalized AI-models development and validation, a Python application was developed to encapsulate the DIY framework in a usable module. Additionally, the Docker tool (<xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B47">47</xref>) was used to containerize the app, enabling its use in different Operating Systems (OSs), including those used in smartphones. In this work, this module was validated in Windows 10 and Ubuntu LTS 24.04, to prove that this module was OS-agnostic. Only the LSTM for 30-min PH was implemented in this stage, since it was the model with the shortest training times, and this was sufficient to test the DIY module functionality.</p>
<p>The design of the application aimed to increase the users&#x0027; empowerment (<xref ref-type="bibr" rid="B30">30</xref>) regarding their data and the AI models generation using them. Considering the inclusion criteria, the preprocessing and the obtained results regarding prediction performance of this work, there are cases where the implementation of this AI-based framework is not feasible, e.g., to provide less than a year of data to generate the model, the fact that such year of data does not provide enough samples to properly train the DL architectures, etc. All this information will be prompted to the users when needed. The users will also have the option to skip this information in case they are not interested. Four main scenarios were considered for the design of this tool. A key point is that all these scenarios are triggered by the user by calling the application. In the current stage, this means uploading their CGM sensor data to the DIY module. The possible scenarios that the tool contemplate are:
<list list-type="simple">
<list-item><label>1.</label>
<p>User&#x0027;s first use providing enough data. The DL models are generated and training following a 4-fold cross-validation approach. The best model is selected and locally stored to be the one that will provide the personalized CGM predictions.</p></list-item>
<list-item><label>2.</label>
<p>User&#x0027;s first use without providing enough data. No DL model will be generated. The application will encourage the user to upload her/his again, indicating why user&#x0027;s data was not suitable for the CGM prediction (if desired).</p></list-item>
<list-item><label>3.</label>
<p>User&#x0027;s second (or beyond) use providing enough and uninterrupted data (i.e., one day with the proposed approach, as it is the input length of the DL models). The model generated in 1) is called and the CGM prediction is provided.</p></list-item>
<list-item><label>4.</label>
<p>User&#x0027;s second (or beyond) use and not providing enough data. No prediction will be provided, and, if the user wants so, an explanation about why the prediction did not take place will be provided.</p></list-item>
</list>The design of the module interface, including the graphics, was developed through a co-creation process. Potential users participated in focus groups, where they expressed their needs and preferences related to the module. One of the objectives of these sessions was to find the best way to represent the glucose data of the potential users. To achieve this, they were asked about their preferences and were shown examples of graphs. Participants chose the ones they found most useful for decision-making regarding their insulin dosage. A total of six focus groups were conducted with participants with T1D (<italic>n</italic>&#x2009;&#x003D;&#x2009;31).</p>
</sec>
</sec>
<sec id="s3" sec-type="results"><label>3</label><title>Results</title>
<sec id="s3a"><label>3.1</label><title>Validation of the proposed ISO-adapted loss functions for DL model training</title>
<p><xref ref-type="fig" rid="F3">Figure&#x00A0;3</xref> shows the comparison of the prediction performance when training the LSTM, Stacked-LSTM and Dil-UNet models with <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM20"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> (green) and the standard MSE (grey). Notice that the na&#x00EF;ve model does not require any training and hence any loss function. The upper part of <xref ref-type="fig" rid="F3">Figure&#x00A0;3</xref> illustrates the metrics for 30-min PH, and the lower part for 60-min PH. This evaluation was performed in terms of RMSE, (<xref ref-type="fig" rid="F3">Figures&#x00A0;3a,f</xref>), MAE, (<xref ref-type="fig" rid="F3">Figures&#x00A0;3b,g</xref>), MAPE, (<xref ref-type="fig" rid="F3">Figures&#x00A0;3c,h</xref>), <italic>ParkesAB</italic>, (<xref ref-type="fig" rid="F3">Figures&#x00A0;3d,i</xref>), and <italic>ISOZone</italic>, (<xref ref-type="fig" rid="F3">Figures&#x00A0;3e,j</xref>). They comprise the results obtained for the included 29 subjects. Notice that for RMSE, MAE, and MAPE, the lower their value, the better the prediction performance, zero being the ideal value. Conversely, <italic>ParkesAB</italic> and <italic>ISOZone</italic> are percentage metrics, where the ideal case would be to have 100&#x0025; of the points within the acceptable zones. Nonetheless, a <italic>ParkesAB</italic> value of 99&#x0025; and an <italic>ISOZone</italic> value of 95&#x0025; are compliant with the ISO 15197:2015 standard (<xref ref-type="bibr" rid="B32">32</xref>).</p>
<fig id="F3" position="float"><label>Figure 3</label>
<caption><p>Comparison of metric performance for the proposed loss functions: MSE and <italic>L</italic><sub>ISO</sub>. Boxplots of the evaluation metrics in all subjects&#x2019; (<italic>n</italic>&#x2009;&#x003D;&#x2009;29) four validation folds in the three proposed DL models training them with the standard MSE (grey) and the <italic>L</italic><sub>ISO</sub> function (green) for 30- (top) and 60-min (bottom) predictions. In the boxplots, centre line represents the median, box comprises second and third quartiles, whiskers extend up to 1.5 times the interquartile range, and circles denotes outliers. The na&#x00EF;ve model was not included because it does not require any training. The lower the RMSE, MAE and MAPE, the better the prediction performance. The higher the ISOZone and ParkesAB, the better the prediction performance. The dash lines represent the ISOZone and ParkesAB minimum requirements according to the ISO 15197:2015 standard. <bold>(a)</bold> RMSE, 30-min PH. <bold>(b)</bold> MAE, 30-min PH. <bold>(c)</bold> MAPE, 30-min PH. <bold>(d)</bold> ParkesAB, 30-min PH. <bold>(e)</bold> ISOZone, 30-min PH. <bold>(f)</bold> RMSE, 60-min PH. <bold>(g)</bold> MAE, 60-min PH. <bold>(h)</bold> MAPE, 60-min PH. <bold>(i)</bold> ParkesAB, 60-min PH. <bold>(j)</bold> ISOZone, 60-min PH.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-07-1534830-g003.tif"/>
</fig>
<p>These results show that the proposed <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM21"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> training provided a similar prediction performance than the standard MSE for all models and for both PHs. Both <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM22"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> and MSE showed higher variability for the 60-min PH (<xref ref-type="fig" rid="F3">Figures&#x00A0;3f&#x2013;j</xref>), than for the 30-min PH (<xref ref-type="fig" rid="F3">Figures&#x00A0;3a&#x2013;e</xref>). The 30-min prediction implies less uncertainty than the 60-min prediction and, therefore, both error magnitude and variability increase in the latter case. MSE and <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM23"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> training presented equivalent performance, although the median metrics in MSE metrics showed slightly better performance than <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM24"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>. In the case of the 60-min prediction, <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM25"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> training improves the Dil-UNet performance in terms of all metrics (<xref ref-type="fig" rid="F3">Figures&#x00A0;3f&#x2013;j</xref>). Besides, this improvement is the largest among all the models comparing both loss functions. Considering that the 60-min PH is a more complex task than the 30-min analogue, and that the Dil-UNet has around 15 and 8 times more parameters than LSTM and Stacked-LSTM respectively (see <xref ref-type="sec" rid="s11">Supplementary Table S1</xref>), this suggests that the larger the PH and the more complex the model, the more evident is the <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM26"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> influence in glucose forecasting. Besides, it can also be observed that the performance limitations inherent to the proposed DL architectures are not overcome by the use of any loss function. As an example, the use of <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM27"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> to train the Dil-UNet, improves the prediction performance compared to the MSE training, but it does not outperform the Stacked-LSTM or the LSTM.</p>
</sec>
<sec id="s3b"><label>3.2</label><title>Comparison between different models for personalized interstitial glucose forecasting</title>
<p><xref ref-type="table" rid="T1">Tables&#x00A0;1</xref>, <xref ref-type="table" rid="T2">2</xref> show the mean and Standard Deviation (SD) of the obtained results for 30-min and 60-min PHs, respectively, considering the four validation folds in all subjects (<italic>n</italic>&#x2009;&#x003D;&#x2009;29) for the four evaluated models. Results are grouped by the loss function used to train the DL models.</p>
<table-wrap id="T1" position="float"><label>Table 1</label>
<caption><p>Evaluation metrics in the validation folds for the proposed models for MSE and <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM28"><mml:msub><mml:mrow><mml:mi mathvariant="bold-italic">L</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="bold-italic">I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:math></inline-formula> loss functions and the 30-min PH. Results are shown as mean&#x2009;&#x00B1;&#x2009;SD of the included subjects (<italic>n</italic>&#x2009;&#x003D;&#x2009;29). Results in bold font indicate the model with the best performance for a specific metric.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left" colspan="6"><bold>Loss function&#x2009;&#x003D;&#x2009;MSE</bold></th>
</tr>
<tr>
<th valign="top" align="left"><bold>Metric</bold></th>
<th valign="top" align="center" rowspan="2"><bold>RMSE (mg/dl)</bold></th>
<th valign="top" align="center" rowspan="2"><bold>MAE (mg/dl)</bold></th>
<th valign="top" align="center" rowspan="2"><bold>MAPE (&#x0025;)</bold></th>
<th valign="top" align="center" rowspan="2"><bold><italic>ParkesAB</italic> (&#x0025;)</bold></th>
<th valign="top" align="center" rowspan="2"><bold><italic>ISOZone</italic> (&#x0025;)</bold></th>
</tr>
<tr>
<th valign="top" align="left"><bold>Model</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><bold>Na&#x00EF;ve</bold><xref ref-type="table-fn" rid="table-fn2"><sup>a</sup></xref></td>
<td valign="top" align="center">26.74&#x2009;&#x00B1;&#x2009;3.86</td>
<td valign="top" align="center">19.50&#x2009;&#x00B1;&#x2009;3.00</td>
<td valign="top" align="center">12.63&#x2009;&#x00B1;&#x2009;2.02</td>
<td valign="top" align="center">99.41&#x2009;&#x00B1;&#x2009;0.48</td>
<td valign="top" align="center">71.91&#x2009;&#x00B1;&#x2009;5.67</td>
</tr>
<tr>
<td valign="top" align="left"><bold>LSTM</bold></td>
<td valign="top" align="center"><bold>21.86</bold>&#x2009;&#x00B1;&#x2009;<bold>2.87</bold></td>
<td valign="top" align="center"><bold>15.83</bold>&#x2009;&#x00B1;&#x2009;<bold>2.21</bold></td>
<td valign="top" align="center"><bold>10.28</bold>&#x2009;&#x00B1;&#x2009;<bold>1.57</bold></td>
<td valign="top" align="center">99.77&#x2009;&#x00B1;&#x2009;0.18</td>
<td valign="top" align="center"><bold>79.34</bold>&#x2009;&#x00B1;&#x2009;<bold>4.97</bold></td>
</tr>
<tr>
<td valign="top" align="left"><bold>Stacked-LSTM</bold></td>
<td valign="top" align="center">21.98&#x2009;&#x00B1;&#x2009;2.86</td>
<td valign="top" align="center">15.95&#x2009;&#x00B1;&#x2009;2.18</td>
<td valign="top" align="center">10.34&#x2009;&#x00B1;&#x2009;1.64</td>
<td valign="top" align="center">99.80&#x2009;&#x00B1;&#x2009;0.15</td>
<td valign="top" align="center">78.91&#x2009;&#x00B1;&#x2009;5.81</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Dil-UNet</bold></td>
<td valign="top" align="center">24.46&#x2009;&#x00B1;&#x2009;3.14</td>
<td valign="top" align="center">18.28&#x2009;&#x00B1;&#x2009;2.42</td>
<td valign="top" align="center">11.08&#x2009;&#x00B1;&#x2009;1.38</td>
<td valign="top" align="center"><bold>99.84</bold>&#x2009;&#x00B1;&#x2009;<bold>0.15</bold></td>
<td valign="top" align="center">76.25&#x2009;&#x00B1;&#x2009;5.03</td>
</tr>
<tr>
<th valign="top" align="left" colspan="6"><bold>Loss function&#x2009;&#x003D;</bold>&#x2009;<inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM29"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula></th>
</tr>
<tr>
<th valign="top" align="left"><bold>Metric</bold></th>
<th valign="top" align="center" rowspan="2"><bold>RMSE (mg/dl)</bold></th>
<th valign="top" align="center" rowspan="2"><bold>MAE (mg/dl)</bold></th>
<th valign="top" align="center" rowspan="2"><bold>MAPE (&#x0025;)</bold></th>
<th valign="top" align="center" rowspan="2"><bold><italic>ParkesAB</italic> (&#x0025;)</bold></th>
<th valign="top" align="center" rowspan="2"><bold><italic>ISOZone</italic> (&#x0025;)</bold></th>
</tr>
<tr>
<th valign="top" align="left"><bold>Model</bold></th>
</tr>
<tr>
<td valign="top" align="left"><bold>Na&#x00EF;ve</bold><xref ref-type="table-fn" rid="table-fn2"><sup>a</sup></xref></td>
<td valign="top" align="center">26.74&#x2009;&#x00B1;&#x2009;3.86</td>
<td valign="top" align="center">19.50&#x2009;&#x00B1;&#x2009;3.00</td>
<td valign="top" align="center">12.63&#x2009;&#x00B1;&#x2009;2.02</td>
<td valign="top" align="center">99.41&#x2009;&#x00B1;&#x2009;0.48</td>
<td valign="top" align="center">71.91&#x2009;&#x00B1;&#x2009;5.67</td>
</tr>
<tr>
<td valign="top" align="left"><bold>LSTM</bold></td>
<td valign="top" align="center"><bold>22.05</bold>&#x2009;&#x00B1;&#x2009;<bold>2.94</bold></td>
<td valign="top" align="center"><bold>16.00</bold>&#x2009;&#x00B1;&#x2009;<bold>2.22</bold></td>
<td valign="top" align="center"><bold>10.35</bold>&#x2009;&#x00B1;&#x2009;<bold>1.53</bold></td>
<td valign="top" align="center">99.76&#x2009;&#x00B1;&#x2009;0.20</td>
<td valign="top" align="center"><bold>79.20</bold>&#x2009;&#x00B1;&#x2009;<bold>4.77</bold></td>
</tr>
<tr>
<td valign="top" align="left"><bold>Stacked-LSTM</bold></td>
<td valign="top" align="center">22.39&#x2009;&#x00B1;&#x2009;3.91</td>
<td valign="top" align="center">16.34&#x2009;&#x00B1;&#x2009;3.04</td>
<td valign="top" align="center">10.49&#x2009;&#x00B1;&#x2009;1.61</td>
<td valign="top" align="center">99.80&#x2009;&#x00B1;&#x2009;0.13</td>
<td valign="top" align="center">78.11&#x2009;&#x00B1;&#x2009;6.13</td>
</tr>
<tr>
<td valign="top" align="left"><bold>DIL-UNet</bold></td>
<td valign="top" align="center">24.84&#x2009;&#x00B1;&#x2009;3.30</td>
<td valign="top" align="center">18.60&#x2009;&#x00B1;&#x2009;2.58</td>
<td valign="top" align="center">11.23&#x2009;&#x00B1;&#x2009;1.49</td>
<td valign="top" align="center"><bold>99.83</bold>&#x2009;&#x00B1;&#x2009;<bold>0.15</bold></td>
<td valign="top" align="center">75.57&#x2009;&#x00B1;&#x2009;5.40</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn2"><label><sup>a</sup></label>
<p>Na&#x00EF;ve model does not require any training, but its metrics are placed to compare this baseline model to the rest of the proposed models.</p></fn>
</table-wrap-foot>
</table-wrap>
<table-wrap id="T2" position="float"><label>Table 2</label>
<caption><p>Evaluation metrics in the validation folds for the proposed models for MSE and <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM30"><mml:msub><mml:mrow><mml:mi mathvariant="bold-italic">L</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="bold-italic">I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:math></inline-formula> loss functions and the 60-min PH. Results are shown as mean &#x00B1; SD of the included subjects (<italic>n</italic> &#x003D; 29). Results in bold font indicate the model with the best performance for a specific metric.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left" colspan="6">Loss function&#x2009;&#x003D;&#x2009;MSE</th>
</tr>
<tr>
<th valign="top" align="left">Metric</th>
<th valign="top" align="center" rowspan="2"><bold>RMSE (mg/dl)</bold></th>
<th valign="top" align="center" rowspan="2"><bold>MAE (mg/dl)</bold></th>
<th valign="top" align="center" rowspan="2"><bold>MAPE (&#x0025;)</bold></th>
<th valign="top" align="center" rowspan="2"><bold><italic>ParkesAB</italic> (&#x0025;)</bold></th>
<th valign="top" align="center" rowspan="2"><bold><italic>ISOZone</italic> (&#x0025;)</bold></th>
</tr>
<tr>
<th valign="top" align="left">Model</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><bold>Na&#x00EF;ve</bold><xref ref-type="table-fn" rid="table-fn4"><bold><sup>a</sup></bold></xref></td>
<td valign="top" align="center">44.64&#x2009;&#x00B1;&#x2009;6.78</td>
<td valign="top" align="center">33.18&#x2009;&#x00B1;&#x2009;5.31</td>
<td valign="top" align="center">21.75&#x2009;&#x00B1;&#x2009;3.66</td>
<td valign="top" align="center">96.17&#x2009;&#x00B1;&#x2009;2.03</td>
<td valign="top" align="center">50.61&#x2009;&#x00B1;&#x2009;6.01</td>
</tr>
<tr>
<td valign="top" align="left"><bold>LSTM</bold></td>
<td valign="top" align="center">38.50&#x2009;&#x00B1;&#x2009;5.13</td>
<td valign="top" align="center">28.58&#x2009;&#x00B1;&#x2009;3.96</td>
<td valign="top" align="center">18.39&#x2009;&#x00B1;&#x2009;2.88</td>
<td valign="top" align="center">97.68&#x2009;&#x00B1;&#x2009;1.36</td>
<td valign="top" align="center">55.29&#x2009;&#x00B1;&#x2009;6.35</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Stacked-LSTM</bold></td>
<td valign="top" align="center"><bold>38.38</bold>&#x2009;&#x00B1;&#x2009;<bold>4.84</bold></td>
<td valign="top" align="center"><bold>28.33</bold>&#x2009;&#x00B1;&#x2009;<bold>3.59</bold></td>
<td valign="top" align="center"><bold>18.15</bold>&#x2009;&#x00B1;&#x2009;<bold>2.69</bold></td>
<td valign="top" align="center"><bold>97.79</bold>&#x2009;&#x00B1;&#x2009;<bold>1.23</bold></td>
<td valign="top" align="center"><bold>56.09</bold>&#x2009;&#x00B1;&#x2009;<bold>6.11</bold></td>
</tr>
<tr>
<td valign="top" align="left"><bold>Dil-UNet</bold></td>
<td valign="top" align="center">40.25&#x2009;&#x00B1;&#x2009;5.71</td>
<td valign="top" align="center">30.63&#x2009;&#x00B1;&#x2009;4.31</td>
<td valign="top" align="center">19.70&#x2009;&#x00B1;&#x2009;3.47</td>
<td valign="top" align="center">97.13&#x2009;&#x00B1;&#x2009;2.00</td>
<td valign="top" align="center">51.06&#x2009;&#x00B1;&#x2009;6.82</td>
</tr>
<tr>
<th valign="top" align="left" colspan="6">Loss Function&#x2009;&#x003D;&#x2009;<inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM31"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula></th>
</tr>
<tr>
<th valign="top" align="left"><bold>Metric</bold></th>
<th valign="top" align="center" rowspan="2"><bold>RMSE (mg/dl)</bold></th>
<th valign="top" align="center" rowspan="2"><bold>MAE (mg/dl)</bold></th>
<th valign="top" align="center" rowspan="2"><bold>MAPE (&#x0025;)</bold></th>
<th valign="top" align="center" rowspan="2"><bold><italic>ParkesAB</italic> (&#x0025;)</bold></th>
<th valign="top" align="center" rowspan="2"><bold><italic>ISOZone</italic></bold></th>
</tr>
<tr>
<th valign="top" align="left"><bold>Model</bold></th>
</tr>
<tr>
<td valign="top" align="left"><bold>Na&#x00EF;ve</bold><xref ref-type="table-fn" rid="table-fn4"><sup>a</sup></xref></td>
<td valign="top" align="center">44.64&#x2009;&#x00B1;&#x2009;6.78</td>
<td valign="top" align="center">33.18&#x2009;&#x00B1;&#x2009;5.31</td>
<td valign="top" align="center">21.75&#x2009;&#x00B1;&#x2009;3.66</td>
<td valign="top" align="center">96.17&#x2009;&#x00B1;&#x2009;2.03</td>
<td valign="top" align="center">50.61&#x2009;&#x00B1;&#x2009;6.01</td>
</tr>
<tr>
<td valign="top" align="left"><bold>LSTM</bold></td>
<td valign="top" align="center">38.52&#x2009;&#x00B1;&#x2009;5.18</td>
<td valign="top" align="center">28.60&#x2009;&#x00B1;&#x2009;3.92</td>
<td valign="top" align="center">18.44&#x2009;&#x00B1;&#x2009;2.90</td>
<td valign="top" align="center">97.67&#x2009;&#x00B1;&#x2009;1.31</td>
<td valign="top" align="center">55.19&#x2009;&#x00B1;&#x2009;6.56</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Stacked-LSTM</bold></td>
<td valign="top" align="center"><bold>38.44</bold>&#x2009;&#x00B1;&#x2009;<bold>4.51</bold></td>
<td valign="top" align="center"><bold>28.44</bold>&#x2009;&#x00B1;&#x2009;<bold>3.29</bold></td>
<td valign="top" align="center"><bold>18.33</bold>&#x2009;&#x00B1;&#x2009;<bold>2.52</bold></td>
<td valign="top" align="center"><bold>97.77</bold>&#x2009;&#x00B1;&#x2009;<bold>1.07</bold></td>
<td valign="top" align="center"><bold>55.65</bold>&#x2009;&#x00B1;&#x2009;<bold>5.93</bold></td>
</tr>
<tr>
<td valign="top" align="left"><bold>DIL-UNet</bold></td>
<td valign="top" align="center">40.00&#x2009;&#x00B1;&#x2009;5.66</td>
<td valign="top" align="center">30.31&#x2009;&#x00B1;&#x2009;4.30</td>
<td valign="top" align="center">19.27&#x2009;&#x00B1;&#x2009;3.57</td>
<td valign="top" align="center">97.43&#x2009;&#x00B1;&#x2009;1.98</td>
<td valign="top" align="center">51.83&#x2009;&#x00B1;&#x2009;6.97</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn4"><label><sup>a</sup></label>
<p>Na&#x00EF;ve model does not require any training, but its metrics are placed to compare this baseline model to the rest of the proposed models.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>The three proposed DL models outperformed the na&#x00EF;ve approach (set as baseline for the minimum requirements regarding prediction performance) for all metrics and both PHs. These results show that, among the proposed DL models, there is no architecture that works optimally for both PHs. Moreover, LSTM-based models outperform the Dil-UNet for both loss functions and PHs. This might be related to the fact that a recurrent neural network as the LSTM and Stacked-LSTM are based on an architecture that implements memory cells that preserve their state over time, theoretically more suitable for time series prediction purposes than other architectures that are in principle more complex but are not specifically designed to catch the temporal dependencies (<xref ref-type="bibr" rid="B48">48</xref>). Besides, regardless of the employed loss function to train the models, LSTM showed slightly better prediction metrics for 30-min PH, whereas Stacked-LSTM, which has more parameters (see <xref ref-type="sec" rid="s11">Supplementary Table S1</xref>), did it for 60-min PH.</p>
<p>LSTM and Stacked-LSTM presented slightly better results when trained with the standard MSE than when trained with <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM32"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>. Focusing on the difference of all metrics, it is noticeable that <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM33"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> influences more the Stacked-LSTM than the LSTM. This could be related to the fact that the Stacked-LSTM possesses twice the number of parameters than LSTM (see <xref ref-type="sec" rid="s11">Supplementary Table S1</xref>) and hence is more &#x201C;flexible&#x201D; than the LSTM.</p>
<p>Finally, focusing on the diabetes-specific metrics, it is worth noticing that the <italic>ParkesAB</italic> criterion (i.e., to be greater than 99&#x0025;) was fulfilled by all models regardless of the loss function used for the 30-min PH. However, this requirement was not fulfilled for the 60-min PH. All models left from 2.3&#x0025; to 3&#x0025; below the minimum threshold. The <italic>ISOZone</italic> metric, which is the most restrictive requirement based on the ISO 15197:2015 standard (<xref ref-type="bibr" rid="B32">32</xref>), was not fulfilled in any case (i.e., to be greater than 95&#x0025;), for any of the PHs, being around 16&#x0025; and 39&#x0025; below the threshold for 30-min and 60-min PHs, respectively. This might be related to the architectural limitations of the proposed DL models.</p>
</sec>
<sec id="s3c"><label>3.3</label><title>Assessing inter- and intra-subject variability through a subject-wise evaluation</title>
<p>The results presented in the previous section provided insights about the overall differences between the DL models evaluated for interstitial glucose forecasting but did not consider the inter- and intra-subject variability (<xref ref-type="bibr" rid="B49">49</xref>, <xref ref-type="bibr" rid="B50">50</xref>). Due to the fact that this work presents a DL-based DIY module that follows a subject-oriented approach, an individual evaluation of the DL models that would derive in personalized AI feedback is essential. <xref ref-type="fig" rid="F4">Figures&#x00A0;4</xref>, <xref ref-type="fig" rid="F5">5</xref> shows the subject-wise diabetes-specific prediction metrics, namely <italic>ParkesAB</italic> and <italic>ISOZone</italic> metrics after training the models only with <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM34"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> loss functions for 30-min and 60-min PHs, respectively. <xref ref-type="sec" rid="s11">Supplementary Figure S2</xref>, <xref ref-type="sec" rid="s11">Supplementary Figure S3</xref> show the <italic>ParkesAB</italic> and <italic>ISOZone</italic> metrics after training with the MSE for 30- and 60-min PH, respectively, which are equivalent to those obtained after the <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM35"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> training. Subjects&#x0027; IDs were sorted by the number of available CGM samples to train and validate the DL models following the proposed 4-fold trimester-wise cross-validation approach. These two metrics have been analysed in detail because they contemplate the prediction errors that are clinically relevant and are specific for the interstitial glucose prediction task. Additionally, RMSE was also analysed for 30- and 60-min PH after training with both loss functions (<xref ref-type="sec" rid="s11">Supplementary Figure S4</xref>, <xref ref-type="sec" rid="s11">Supplementary Figure S5</xref>, respectively), since it is the metric that is usually taken as the reference to compare between different models in the literature.</p>
<fig id="F4" position="float"><label>Figure 4</label>
<caption><p>Boxplots representing subject-wise (<italic>n</italic>&#x2009;&#x003D;&#x2009;29) ISO-based prediction metrics (parkesAB and ISOZone) computed with the four validation folds (PH&#x2009;&#x003D;&#x2009;30&#x2005;min) for the na&#x00EF;ve model, LTSM, stacked-LSTM, and Dil-uNet after being trained with <italic>L</italic><sub>ISO</sub>. The subjects are sorted in descending order of available instances to train the models. In the boxplots, the centre line, the box limits and the whiskers represent the median, the upper and lower quartile and the 1.5&#x00D7; interquartile range, respectively. <bold>(a)</bold> ParkesAB. <bold>(b)</bold> ISOZone.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-07-1534830-g004.tif"/>
</fig>
<fig id="F5" position="float"><label>Figure 5</label>
<caption><p>Boxplots representing subject-wise (<italic>n</italic>&#x2009;&#x003D;&#x2009;29) ISO-based prediction metrics (parkesAB and ISOZone) computed with the four validation folds (PH&#x2009;&#x003D;&#x2009;60&#x2005;min) for the na&#x00EF;ve model, LTSM, stacked-LSTM, and Dil-uNet after being trained with <italic>L</italic><sub>ISO</sub>. The subjects are sorted in descending order of available instances to train the models. In the boxplots, the centre line, the box limits and the whiskers represent the median, the upper and lower quartile and the 1.5&#x00D7; interquartile range, respectively. <bold>(a)</bold> ParkesAB. <bold>(b)</bold> ISOZone.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-07-1534830-g005.tif"/>
</fig>
<p>From <xref ref-type="table" rid="T1">Tables&#x00A0;1</xref>, <xref ref-type="table" rid="T2">2</xref>, no significant differences are observed between the means in any of the evaluated metrics. In all cases, such differences are clearly lower than the average SD. This implies that there are not statistically significant differences in favor of any of the metrics.</p>
<p>It is worth noting that, although a sufficient number of samples is required to properly train a DL model, it can be observed that more CGM samples do not imply more accurate predictions in the proposed DL models. This effect is related to: (1) the glucose patterns heterogeneity among subjects (i.e., inter-subject variability) (<xref ref-type="bibr" rid="B49">49</xref>), specially in people with T1D (<xref ref-type="bibr" rid="B50">50</xref>); (2) the day-to-day CGM variability (i.e., intra-subject variability) (<xref ref-type="bibr" rid="B51">51</xref>); and (3) the various factors that influence the subject&#x0027;s glucose dynamics (such as insulin administration, subject metabolism, carbohydrate intake, physical activity) that are not contemplated in the proposed DL models training because only CGM data were employed in this study.</p>
<p>In concordance with the results exposed in the global validation (<xref ref-type="table" rid="T1">Table&#x00A0;1</xref>), in the vast majority of the cases the LSTM-based models presented better prediction performance in terms of RMSE (<xref ref-type="sec" rid="s11">Supplementary Figure S4</xref>, <xref ref-type="sec" rid="s11">Supplementary Figure S5</xref>) than the na&#x00EF;ve model for both PHs, even though for some subjects the na&#x00EF;ve model showed lower variability (e.g., subjects &#x0023;045, &#x0023;048, and &#x0023;068, <xref ref-type="sec" rid="s11">Supplementary Figure S4a</xref>). In the case of Dil-UNet, most of the cases presented lower median than the na&#x00EF;ve model but its strong dependency on the fold (i.e., high intra-subject variability) makes it a less robust model than the na&#x00EF;ve approach for a few subjects (e.g., subject &#x0023;48, <xref ref-type="sec" rid="s11">Supplementary Figure S4b</xref>). Dil-UNet showed the largest variability within the four validation folds for both PHs (<xref ref-type="sec" rid="s11">Supplementary Figure S4</xref>, <xref ref-type="sec" rid="s11">Supplementary Figure S5</xref>) in almost all subjects trained with both loss functions, with a few exceptions (e.g., subject &#x0023;004 and &#x0023;014, <xref ref-type="sec" rid="s11">Supplementary Figure S4a</xref>). This means that, in general and for both PHs, the Dil-UNet prediction performance is more dependent on the folds (i.e., more sensible to the intra-subject variability) than the LSTM-based models. Thus, the interstitial glucose prediction reliability depends more on the time of the year used for the model training, making it a less robust model in terms of RMSE than the LSTM-based models. This could be related to the fact that Dil-UNet has a significantly larger number of parameters than the other two models (see <xref ref-type="sec" rid="s11">Supplementary Table S1</xref>), so more samples might be needed to achieve better prediction performance.</p>
<p>The improvement presented by the proposed models compared to the na&#x00EF;ve model becomes more evident studying the <italic>ParkesAB</italic> metric for both PHs. The training of the DL models using both loss functions outperformed the na&#x00EF;ve approach, although in a few cases some models presented slightly higher variability (e.g., subject &#x0023;007, <xref ref-type="fig" rid="F4">Figure&#x00A0;4a</xref>). In the case of 30-min PH (<xref ref-type="fig" rid="F4">Figure&#x00A0;4a</xref>; <xref ref-type="sec" rid="s11">Supplementary Figure S2a</xref>), the only exceptions were subjects &#x0023;068 and &#x0023;058, which are the ones that had the fewest available samples for training. In the case of 60-min PH, the three DL models of the seven subjects with fewer samples (&#x0023;063, &#x0023;055, &#x0023;061, &#x0023;057 &#x0023;003, &#x0023;068, and &#x0023;058) presented equivalent <italic>ParkesAB</italic> (<xref ref-type="fig" rid="F5">Figure&#x00A0;5a</xref>; <xref ref-type="sec" rid="s11">Supplementary Figure S3a</xref>). This happened with the training of both functions, but it was more evident with <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM36"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> training. Apart from these exceptions related to the lack of enough samples, LSTM-based models always showed higher <italic>ParkesAB</italic>, and also Dil-UNet (except for subjects &#x0023;065 and &#x0023;046).</p>
<p>Prediction performance in terms of <italic>ParkesAB</italic> and <italic>ISOZone</italic> evidences the RMSE limitations to properly characterize the interstitial glucose forecasting model performance. Firstly, model variability among folds related to the lack of training samples showed by the diabetes-specific metrics was not reflected by RMSE. Besides, <italic>ParkesAB</italic> and <italic>ISOZone</italic> give more importance to samples that are clinically relevant (i.e., prediction errors of hypoglycemic and hyperglycemic events), it therefore provides more information on whether the prediction model is suitable for this specific task. As an example, comparing RMSE and <italic>ParkesAB</italic> metrics for the 30-min PH training with MSE loss function (<xref ref-type="sec" rid="s11">Supplementary Figure S4a</xref>, <xref ref-type="sec" rid="s11">Supplementary Figure S2a</xref>, respectively) of subjects &#x0023;067 and &#x0023;025, it is observed that &#x0023;067 presented lower RMSE (i.e., better prediction) in all models than subject &#x0023;025. Nonetheless, subject &#x0023;025 presented a higher <italic>ParkesAB</italic> (i.e., better prediction in the diabetes context). Hence, even though subject &#x0023;067 predictions showed a lower RMSE, the predictions of subject &#x0023;025 will be more clinically reliable and relevant. Thus, lower RMSE does not always imply better interstitial glucose predictions for people with T1D. This was consistent when comparing also the RMSE with <italic>ISOZone</italic> (Figures&#x00A0;4b,<xref ref-type="fig" rid="F5">5b</xref>; <xref ref-type="sec" rid="s11">Supplementary Figure S2b</xref>, <xref ref-type="sec" rid="s11">Supplementary Figure S3b</xref>).</p>
<p>Besides, even though more training samples do not ensure better prediction performance, obtained results have set a threshold regarding available training CGM samples to achieve a fairly reliable glucose prediction. Such threshold is different for each PH. Setting the limit where the na&#x00EF;ve approach (i.e., the predicted sequence consists of the last samples of the input) achieves equivalent <italic>ParkesAB</italic> and <italic>ISOZone</italic> in terms of median and SD than all three proposed DL models, the threshold for 30-min PH is &#x223C;1,500 CGM training samples, whereas for 60-min PH it is &#x223C;5,000. Such a difference might be related to the complexity of the task. A more complex prediction requires, in principle, more training samples to properly learn the phenomenon. This phenomenon occurred for both loss functions and both PHs (<xref ref-type="fig" rid="F4">Figures&#x00A0;4c,d</xref>, <xref ref-type="fig" rid="F5">5c,d</xref>). Notice that both diabetes-specific metrics show consistency in setting these thresholds. Hence, the proposed DIY module will discard potential users that provide CGM data that would end in a training and validation dataset with less training samples than the correspondent threshold, since it has been demonstrated that this number is not enough to generate a reliable interstitial prediction model using the proposed DL models.</p>
<p><italic>ParkesAB</italic> metric is based on the least restrictive requirement of ISO 15197:2015 (<xref ref-type="bibr" rid="B32">32</xref>), that establishes that at least 99&#x0025; of the prediction errors must fall within certain limits considering the clinically critical glucose concentrations. A DL model whose predictions meet this requirement can be considered clinically safe under this criterion. Studying this metric for the 30-min PH (<xref ref-type="fig" rid="F4">Figures&#x00A0;4c,d</xref> training with <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM37"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>, and <xref ref-type="sec" rid="s11">Supplementary Figure S2a</xref>, <xref ref-type="sec" rid="s11">Supplementary Figure S3a</xref> training with MSE) the three proposed DL models met this requirement within the four validation folds of the 29 subjects. Also, the na&#x00EF;ve approach, except for subjects &#x0023;065 and &#x0023;001, met this ISO requirement, which explains why the most restrictive criteria included in the ISO standard has been also evaluated in this work (i.e., <italic>ISOZone</italic>). Conversely, for the 60-min PH, only 7 out of the 29 subjects met this criterion training with MSE (<xref ref-type="sec" rid="s11">Supplementary Figure S3a</xref>), and 9 out of 29 subjects training with <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM38"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> (<xref ref-type="fig" rid="F5">Figure&#x00A0;5A</xref>). Hence, even though <xref ref-type="table" rid="T1">Table&#x00A0;1</xref> shows unfavorable results of the proposed novel loss function, more subjects are included in the <italic>ParkesAB</italic> acceptable zone for 60-min PH. This evidences the need for performing a subject-oriented evaluation of the DL models when proposing approaches such as a DIY using diabetes-specific metrics (<xref ref-type="bibr" rid="B52">52</xref>). However, the results obtained reveal the need for further improvement in the proposed architectures.</p>
<p><italic>ISOZone</italic> metric, is the most restrictive condition of ISO 15197:2015 (<xref ref-type="bibr" rid="B32">32</xref>), setting the minimum of the prediction errors in 95&#x0025; within the acceptable zone. Thus, fulfilling this requirement would lead to more clinically safe actuations than only fulfilling <italic>ParkesAB</italic> requirement. Unfortunately, the <italic>ISOZone</italic> metric did not surpass 95&#x0025; in any personalized DL model, confirming the fact further improvements in the architectures should be assessed (<xref ref-type="fig" rid="F4">Figures&#x00A0;4b</xref>,5b; <xref ref-type="sec" rid="s11">Supplementary Figure S2b</xref>, <xref ref-type="sec" rid="s11">Supplementary Figure S3b</xref>).</p>
<p>Finally, assessing the inter-subject variability, it is observed that none of the three proposed DL models work optimally for all subjects, although LSTM-based models presented the best average prediction performance (<xref ref-type="table" rid="T1">Table&#x00A0;1</xref>). For example, for the 60-min PH, Dil-UNet prediction in subject &#x0023;055 shows the best <italic>ParkesAB</italic> trained with <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM39"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>, slightly better than LSTM-based models. However, the same model presented by far the worst <italic>ParkesAB</italic> in subject &#x0023;65 compared to LSTM-based models, and slightly worse than the na&#x00EF;ve approach (<xref ref-type="fig" rid="F5">Figure&#x00A0;5a</xref>). The same occurs with the <italic>ISOZone</italic> (<xref ref-type="fig" rid="F5">Figure&#x00A0;5b</xref>). Regarding RMSE, the Stacked-LSTM model trained with MSE presented relatively low variability within folds for both PHs and loss functions, although there are some exceptions (<xref ref-type="sec" rid="s11">Supplementary Figure S4</xref>, <xref ref-type="sec" rid="s11">Supplementary Figure S5</xref>). However, mean and SD variations in all metrics are comparable within all models. Considering that besides the inter-subject variability, the CGM samples of the subjects can present different day-to-day and intra-subject variability (<xref ref-type="bibr" rid="B51">51</xref>), this suggests that the variability and prediction capabilities are strongly dependent on the subject. There is not a DL model that clearly outperforms the rest, but all of them present better prediction performance in the same subjects, although there are some variations related to how a certain architecture has learnt about a given trend of the subject&#x0027;s CGM data.</p>
</sec>
<sec id="s3d"><label>3.4</label><title>Comparison with other state-of-the-art studies</title>
<p>There are many studies in the scientific literature that have assessed the glucose forecasting problem. However, for a fair comparison with this work, the following criteria were used for the selection of other studies:
<list list-type="simple">
<list-item><label>a.</label>
<p>Explicit indications that the glucose prediction was performed in people with T1D.</p></list-item>
<list-item><label>b.</label>
<p>Reported results of 30-min and/or 60-min PHs.</p></list-item>
<list-item><label>c.</label>
<p>Reporting results from a validation and/or test set of real glucose data.</p></list-item>
<list-item><label>d.</label>
<p>The number of subjects included in the evaluation, i.e., <italic>n</italic>, was greater than 5.</p></list-item>
</list><xref ref-type="table" rid="T3">Table&#x00A0;3</xref> shows the comparison between the included studies. It is worth noticing that all the subjects included in the dataset collected and used in our work had sensors with a sampling period of 15&#x2005;min. This limits the temporal information provided to the DL models compared to the other considered studies that included CGM data sampled every 5&#x2005;min. This could be partially mitigated by increasing number of input time steps of the DL models. Moreover, our work and the work presented by De Paoli et al. (<xref ref-type="bibr" rid="B40">40</xref>) were the only ones that fed the models with solely CGM data. This also justifies that the personalized models presented here had the largest input window length within the compared models.</p>
<table-wrap id="T3" position="float"><label>Table 3</label>
<caption><p>Comparison of the proposed DIY framework with other state-of-the-art approaches. Results for 30- and 60-min PHs are shown as mean &#x00B1; SD (when both reported). Best results are highlighted in bold for each metric. Only test or validation results are included. (<italic>n</italic>, number of subjects to evaluate the models; SP, sampling period of the sensors considered in the work; <italic>N</italic>, input window length; Pers. Models: if personalized models were developed in the work; N/A, result not available in the original work).</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left" rowspan="2">Model (&#x0023;subjects)</th>
<th valign="top" align="center" rowspan="2">SP (min)</th>
<th valign="top" align="center" rowspan="2">inputs</th>
<th valign="top" align="center" rowspan="2">N (time)</th>
<th valign="top" align="center" rowspan="2">Train/validation/test periods</th>
<th valign="top" align="center" rowspan="2">Pers. models</th>
<th valign="top" align="center" colspan="3">30-min PH</th>
<th valign="top" align="center" colspan="3">60-min PH</th>
</tr>
<tr>
<th valign="top" align="center">RMSE (mg/dl)</th>
<th valign="top" align="center"><italic>ParkesAB</italic> (&#x0025;)</th>
<th valign="top" align="center"><italic>ISOZone</italic> (&#x0025;)</th>
<th valign="top" align="center">RMSE (mg/dl)</th>
<th valign="top" align="center"><italic>ParkesAB</italic> (&#x0025;)</th>
<th valign="top" align="center"><italic>ISOZone</italic> (&#x0025;)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top">Proposed LSTM and stacked-LSTM<xref ref-type="table-fn" rid="table-fn6"><sup>a</sup></xref> (<italic>n</italic>&#x2009;&#x003D;&#x2009;29)</td>
<td valign="top">&#x2022; 15</td>
<td valign="top">
<list list-type="simple">
<list-item><label>-</label>
<p>CGM</p></list-item>
<list-item><label>-</label>
<p>CGM 1st derivative</p></list-item>
</list></td>
<td valign="top">96 (24&#x2005;h)</td>
<td valign="top">9 months/3 months/(4-fold cross-validation)</td>
<td valign="top">Yes</td>
<td valign="top">21.86&#x2009;&#x00B1;&#x2009;2.86</td>
<td valign="top" align="center"><bold>99.77</bold>&#x2009;<bold>&#x00B1;</bold>&#x2009;<bold>0.19</bold></td>
<td valign="top" align="center"><bold>79.34</bold>&#x2009;<bold>&#x00B1;</bold>&#x2009;<bold>4.95</bold></td>
<td valign="top" align="center">38.44&#x2009;&#x00B1;&#x2009;4.55</td>
<td valign="top" align="center"><bold>97.77</bold>&#x2009;<bold>&#x00B1;</bold>&#x2009;<bold>1.06</bold></td>
<td valign="top" align="center"><bold>56.09</bold>&#x2009;<bold>&#x00B1;</bold>&#x2009;<bold>6.13</bold></td>
</tr>
<tr>
<td valign="top">Multi-input dilated CNN (<xref ref-type="bibr" rid="B24">24</xref>) (<italic>n</italic>&#x2009;&#x003D;&#x2009;97)</td>
<td valign="top">5</td>
<td valign="top">
<list list-type="simple">
<list-item><label>-</label>
<p>CGM</p></list-item>
<list-item><label>-</label>
<p>Meal intake</p></list-item>
<list-item><label>-</label>
<p>Basal insulin rate</p></list-item>
<list-item><label>-</label>
<p>Bolus insulin</p></list-item>
</list></td>
<td valign="top">Multi-step of 36 (3&#x2005;h)</td>
<td valign="top">143.42&#x2009;&#x00B1;&#x2009;90.39 days/-/25.37&#x2009;&#x00B1;&#x2009;4.96 days</td>
<td valign="top">No</td>
<td valign="top">23.22&#x2009;&#x00B1;&#x2009;6.39</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A<xref ref-type="table-fn" rid="table-fn7"><sup>b</sup></xref></td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
</tr>
<tr>
<td valign="top">Multi-input dilated CNN (<xref ref-type="bibr" rid="B25">25</xref>) (<italic>n</italic>&#x2009;&#x003D;&#x2009;10.6)</td>
<td valign="top">5</td>
<td valign="top">
<list list-type="simple">
<list-item><label>-</label>
<p>CGM</p></list-item>
<list-item><label>-</label>
<p>Insulin</p></list-item>
<list-item><label>-</label>
<p>Meal intake</p></list-item>
<list-item><label>-</label>
<p>Time stamps</p></list-item>
</list></td>
<td valign="top">Sliding window of 16 (1.25&#x2005;h)</td>
<td valign="top"><italic>Dataset 1</italic>: 90 days/-/90 days <italic>Dataset 2</italic>: 40 days/-/10 days</td>
<td valign="top">No</td>
<td valign="top">19.19&#x2009;&#x00B1;&#x2009;2.74 19.28&#x2009;&#x00B1;&#x2009;2.76</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">31.78&#x2009;&#x00B1;&#x2009;4.94 31.83&#x2009;&#x00B1;&#x2009;3.49</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
</tr>
<tr>
<td valign="top">Jump neural network (<xref ref-type="bibr" rid="B40">40</xref>) (<italic>n</italic>&#x2009;&#x003D;&#x2009;10)</td>
<td valign="top">&#x2013;</td>
<td valign="top">
<list list-type="simple">
<list-item><label>-</label>
<p>CGM</p></list-item>
</list></td>
<td valign="top">N/A<break/>(10&#x2005;min)</td>
<td valign="top">1 day/-/1 day or more</td>
<td valign="top">Yes</td>
<td valign="top" align="center">24.9</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
</tr>
<tr>
<td valign="top">LSTM (<xref ref-type="bibr" rid="B26">26</xref>) (<italic>n</italic>&#x2009;&#x003D;&#x2009;150)</td>
<td valign="top">5</td>
<td valign="top">
<list list-type="simple">
<list-item><label>-</label>
<p>CGM</p></list-item>
<list-item><label>-</label>
<p>Insulin bolus</p></list-item>
</list></td>
<td valign="top">36 (3&#x2005;h)</td>
<td valign="top">105 subjects/ -/45 subjects</td>
<td valign="top">No</td>
<td valign="top">19.8&#x2009;&#x00B1;&#x2009;3.2</td>
<td valign="top" align="center">99.60</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">33.2&#x2009;&#x00B1;&#x2009;5.4</td>
<td valign="top" align="center">97.60</td>
<td valign="top" align="center">N/A</td>
</tr>
<tr>
<td valign="top">Modified N-BEATS (<xref ref-type="bibr" rid="B44">44</xref>) (<italic><sub>n</sub>&#x2009;</italic><sub>&#x003D;&#x2009;6)</sub></td>
<td valign="top">5</td>
<td valign="top">
<list list-type="simple">
<list-item><label>-</label>
<p>CGM</p></list-item>
<list-item><label>-</label>
<p>Finger stick glucose</p></list-item>
<list-item><label>-</label>
<p>Insulin bolus</p></list-item>
<list-item><label>-</label>
<p>Carbohydrate</p></list-item>
<list-item><label>-</label>
<p>Sine of time</p></list-item>
<list-item><label>-</label>
<p>Cosine of time</p></list-item>
</list></td>
<td valign="top">12&#x2013;42 (1&#x2005;h&#x2014;&#x223C;3 h)</td>
<td valign="top">&#x223C;10,000 samples per subject/-/&#x223C;2,500 samples per subject</td>
<td valign="top">No</td>
<td valign="top">18.22</td>
<td valign="top" align="center">99</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">31.66</td>
<td valign="top" align="center">N/A</td>
<td valign="top" align="center">N/A</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn6"><label><sup>a</sup></label>
<p>LSTM was the model selected for 30-min PH, and Stacked-LSTM for 60-min PH.</p></fn>
<fn id="table-fn7"><label><sup>b</sup></label>
<p>Evaluation was performed with a smaller subset of 24 subjects that provided more favourable prediction metrics.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>Focusing on De Paoli&#x0027;s work, it is also the only one reporting the development of a personalized model for each subject. Hence, a fair comparison can be assessed. However, they did not report prediction performance at 60-min PH, and neither did diabetes-specific metrics. Our proposed framework outperformed the results obtained by De Paoli&#x0027;s work, which is based on Jump Neural Networks (<xref ref-type="bibr" rid="B40">40</xref>), in terms of RMSE at 30-min PH. Thus, among the only two studies that reported personalized models using only CGM data, our work provided the best prediction performance.</p>
<p>Although the prediction performance of the DIY-based models is mainly limited by the use of only CGM data, our models achieve comparable performance in terms of RMSE to the rest of considered works for 30-min PH. For 60-min PH, these differences are more significant. The model that presents the best RMSE for both PHs is the N-BEATS (<xref ref-type="bibr" rid="B44">44</xref>). For 30-min PH, our LSTM showed similar performance (21.86&#x2009;&#x00B1;&#x2009;2.86 vs. 18.22). This difference is more noticeable for 60-min PHs, where N-BEATS outperforms the Stacked-LSTM (38.44&#x2009;&#x00B1;&#x2009;4.55 against 31.66). Nonetheless, this work only evaluated this model with 6 subjects, whereas we used 29. Moreover, they used several variables as input, including CGM, finger stick glucose, insulin, and carbohydrates intake, among others. It is also worth noticing that our work is the only one reporting <italic>ISOZone</italic> metric, which is the most restrictive criteria of the ISO 15197:2015 standard. Hence, this can serve as a benchmark for comparison in future developments of processing algorithms.</p>
<p>Finally, the <italic>ParkesAB</italic> metric, which is a metric that indicates if the clinical decision based on the predicted CGM labels is clinically safe for the subject, was reported only in two of the studies found in the literature. For the 60-min PH, only one work reported this result without reaching the minimum requirement (&#x2265;99&#x0025;), but our work was closer to the minimum than the LSTM-based model proposed by Mosquera-Lopez et al. (<xref ref-type="bibr" rid="B26">26</xref>) (97.77&#x0025; and 97.60&#x0025;, respectively). For the 30-min PH, the two studies that reported this metric fulfilled the <italic>ParkesAB</italic> requirement. It is worth noticing that the personalized DIY DL models developed in this work presented the best <italic>ParkesAB</italic> metric for both evaluated PHs, evidencing again the limitations of the RMSE as the standard for glucose prediction models comparison. Thus, this approach can be considered the clinically safest among the ones included in this comparative, being the only one that followed a subject-oriented approach for the DL training and validation using only 1-year CGM data from one subject to train the model. Unfortunately, the evaluation of the proposed framework using the OhioT1DM dataset (the most common dataset for glucose forecasting benchmarking) (<xref ref-type="bibr" rid="B53">53</xref>) was not feasible. Our work uses trimester-wise partitions based on 1 year of CGM data, and the OhioT1DM dataset provides only 2 weeks of diabetes-related readings, making impossible to do a fair comparison.</p>
</sec>
<sec id="s3e"><label>3.5</label><title>Evaluation of the DL models using a test set</title>
<p>As a final validation of the DIY DL-based framework for personalized interstitial glucose prediction, additional data from the 29 subjects included in this work were collected to further evaluate the consistency of the above presented results. For every subject, a DL-model was generated using the whole year that was previously partitioned following a 4-folds using <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM40"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub><mml:mo>.</mml:mo></mml:math></inline-formula> Then, the new collected test set was used to evaluate the models. Sensor replacement or data unavailability due to reading interruptions produced a decrease in the number of subjects available for this evaluation. The number of days included in the test set was varied, including 30, 90, 180, and 365 days. This was assessed to analyze if the prediction performance differed depending on the length of the test set. As shown in <xref ref-type="fig" rid="F6">Figure&#x00A0;6</xref>, from the initial 29 subjects, three test sets of subjects were obtained: (1) 20 subjects for testing 30 and 90 days; (2) 19 subjects for testing 180 days; and (3) 7 subjects for testing 365 days. RMSE, <italic>ParkesAB,</italic> and <italic>ISOZone</italic> metrics were analyzed. The boxplots comprise data from <italic>n</italic> subjects, being <italic>n</italic> dependent on the number of days of the test set. Moreover, <xref ref-type="sec" rid="s11">Supplementary Tables S3</xref>, <xref ref-type="sec" rid="s11">Supplementary Table S4</xref> show the mean and SD corresponding to these results for 30- and 60-min PH, respectively.</p>
<fig id="F6" position="float"><label>Figure 6</label>
<caption><p>RMSE, parkesAB, and ISOZone metrics for different test sets after training the personalized models using 1 year of CGM data. The test sets included the first 30, 90, 180, 365 days for each subject (when available). The number of subjects with available data for each experiment is indicated with <italic>n</italic> evaluated with different number of days. For each particular test set the number of subjects with enough available data is indicated with n. The dash line represents the minimum percentage of points in ParkesAB and ISOZone to fulfil the ISO standard. In the boxplots, centre line represents the median, box comprises second and third quartiles, whiskers extend up to 1.5 times the interquartile range, and circles denote outliers. <bold>(a)</bold> 30-min PH. <bold>(b)</bold> 60-min PH.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-07-1534830-g006.tif"/>
</fig>
<p><xref ref-type="fig" rid="F6">Figure&#x00A0;6</xref>; <xref ref-type="sec" rid="s11">Supplementary Tables S3</xref>, <xref ref-type="sec" rid="s11">Supplementary Table S4</xref> show that, for both PHs, the prediction performances barely change when increasing the number of days included in the test set. The greatest change in terms of the median and variability is observed when the test set includes 365 days. This is more evident for 60-min PH (<xref ref-type="fig" rid="F6">Figure&#x00A0;6B</xref>). However, this is likely related to the significant decrease in the number of subjects included. It can be concluded that, following the DIY-approach after training with 1 year of CGM data, testing with one month of data is representative of the overall personalized model performance.</p>
<p>Comparing results of <xref ref-type="table" rid="T1">Table&#x00A0;1</xref>, that shows the prediction metrics after training the models with 9 months, to <xref ref-type="sec" rid="s11">Supplementary Tables S3</xref>, <xref ref-type="sec" rid="s11">Supplementary Table S4</xref>, that shows RMSE, <italic>ParkesAB</italic> and <italic>ISOZone</italic> metrics after training with the whole year, it is observed a general improvement in RMSE and diabetes-specific metrics. However, the 4-folds cross-validation included 29 subjects, and in the test only 20 subjects were included (for 30 and 90 testing days) due to data unavailability. Thus, this performance improvement might be related both due to training with more data (&#x223C;25&#x0025; more, assuming equal distribution of the CGM readings within the year), and due to include less subjects in the evaluation. Furthermore, it is worth noting that for a 60-min PH, the difference between the Dil-U-Net and the LSTM-based models are less, suggesting that the former benefits more from being trained with more data than the LSTM-based. Concluding, the use of an additional test set validates the prediction performance previously shown and, hence, the competitive performance of the DIY model proposed in this work respect the state-of-the-art.</p>
</sec>
<sec id="s3f"><label>3.6</label><title>DIY module implementation and validation in different operating systems</title>
<p>The design of this open-source module has considered its portability for its standalone use, its easy integration in broader applications regardless of the OS running the software, and its modular design so that researchers and developers can test novel architectures following the proposed DIY approach. To prove that this module is OS-agnostic (i.e., it can run over different OSs), the Python application has been deployed to run in a Docker (<xref ref-type="bibr" rid="B46">46</xref>) container, proving its functionality in two different OSs: Windows 10 and Ubuntu LTS 24.04. Although the current version of this module relies on Docker and terminal prompting from a PC and this is not ideal for the use of most of the people with T1D, the <italic>dockerization</italic> of the app facilitates its fast and straightforward integration in a smartphone application, enhancing its potential daily use. The DIY module usage documentation is available in a GitHub public repository (see &#x201C;<xref ref-type="sec" rid="s5">Data availability</xref>&#x201D; section).</p>
<p>For simplicity, only the LSTM architecture was implemented, since it presented the shortest training times with competitive performance. <xref ref-type="fig" rid="F7">Figure&#x00A0;7</xref> shows the workflow of the DIY module from the user&#x0027;s perspective, in a smartphone, even this module is ready to run on a PC, including the first and subsequent uses, considering the cases when the user provides enough data or not, illustrating the information that is prompted to the user. This design was developed through a co-creation process after carrying out several focus groups that included potential users of this module, and it pursuits user engagement, useful interaction, and information supply regarding their personalized AI models.</p>
<fig id="F7" position="float"><label>Figure 7</label>
<caption><p>DIY module workflow from the user&#x0027;s perspective. Notice that the first use of the model implies the model generation and evaluation (if enough data is provided). The user&#x0027;s second use only implies the model call and the computation of the 30-min prediction. This workflow considered the scenarios when the user provides or does not have enough data to generate the DL models. Besides, the DIY module prompts the user with messages regarding the provided CGM data, information about the generation (or lack of it) of the AI model, and with alerts if a hypoglycemic of hyperglycemic event is predicted.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fdgth-07-1534830-g007.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion"><label>4</label><title>Discussion</title>
<p>To the best of our knowledge, this work has presented, for the first time, a DIY module for personalized AI-based interstitial glucose forecasting for people with T1D using only the CGM user data without involving data from other subjects to train the DL models. Additional data, such as physical activity or carbohydrates intake, was not available in the collected data, but the parametrized design of the module will allow its straightforward inclusion as model inputs. The DL models evaluated in the proposed framework presented similar prediction performance results in terms of RMSE, and the best results in a diabetes-specific metric, <italic>ParkesAB</italic>, when compared to the state-of-the-art, outperforming other LSTM- and CNN-based approaches (<xref ref-type="bibr" rid="B24">24</xref>, <xref ref-type="bibr" rid="B26">26</xref>) or modern algorithms designed for time series forecasting, such as N-BEATS (<xref ref-type="bibr" rid="B44">44</xref>). Our results were achieved using only CGM data, whereas most of the comparable studies included also insulin and meal intake as input features in their models (<xref ref-type="bibr" rid="B24">24</xref>&#x2013;<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B44">44</xref>). Additionally, 1 year of CGM data was used for the training and validation of the models, being able to capture more seasons-related phenomena compared to other public available standard datasets for benchmarking glucose prediction models, e.g., the Ohio T1DM Dataset (<xref ref-type="bibr" rid="B53">53</xref>) which contains only eight weeks. The differences in the duration of the acquired dataset made unfeasible a fair comparison of this framework using this dataset. Unlike most of the previously mentioned studies, the development of the DL models in our study was fully personalized (only data from a single subject was employed to train the algorithms). Moreover, to the best of our knowledge, this is the first work that evaluates acceptable <italic>ISOZone</italic> metric, the most restrictive criteria of ISO 15197:2015 (<xref ref-type="bibr" rid="B32">32</xref>), although the proposed DL-models did not fulfil this requirement.</p>
<p>This study also evidenced the need for selecting a diabetes-oriented error metric as a gold standard to compare different glucose prediction models. Results obtained in this work demonstrated that a lower RMSE does not always imply a better prediction in the context of T1D. For example, if a model perfectly predicts all glucose samples that are in range (which are, by far, more than the hypo- and hyper-glycemic samples), it will likely present a lower RMSE than a model that has smaller errors in the critical samples (i.e., hypo- and hyper-glycemic samples), and larger error in the non-critical ones. The latter model will be more clinically useful and safe for this task but would be considered a &#x201C;worse&#x201D; model if only RMSE is evaluated. Hence, the use of metrics such as <italic>ISOZone</italic>, <italic>ParkesAB</italic>, or different indexes derived from the diabetic-specific case (<xref ref-type="bibr" rid="B26">26</xref>) are pivotal to have an appropriate evaluation of these models (<xref ref-type="bibr" rid="B52">52</xref>).</p>
<p>A trimester-wise 4-folds cross-validation was assessed targeting a robust evaluation of the DL models. For each subject (<italic>n</italic>&#x2009;&#x003D;&#x2009;29), the models were trained four times, varying the groups of three trimesters used to train the models and the remaining trimester to test them. This approach aimed to demonstrate if, for the proposed architectures, the prediction performance depended on the time of the year used to train and test the DL models. This dependence varied between different subjects, evidencing the burden of the inter-subject variability. Hence, the obtained results suggested that training the models with weeks or even months of data could not be enough, since there are phenomena that might not been considered in the training of the models (habit changes, holidays, periods of increased or decreased activity, etc. that varies over the year). By taking 1 year of data, the negative impact of such intra-subject variability (<xref ref-type="bibr" rid="B51">51</xref>) can be potentially diminished. The results obtained using the test set after collecting additional data and training the DL models with 1 year of CGM data support this hypothesis, since the prediction performance slightly improved. Besides, results showed that, with this approach, testing with 1 month of data is representative of the overall performance of the personalized DL models.</p>
<p>A novel loss function, <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM41"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>, has been developed to train the DL algorithms. To the best of our knowledge, this is the first work that presents a loss function considering the ISO 15197:2015 standard (<xref ref-type="bibr" rid="B32">32</xref>), tailoring the training of the DL models for the interstitial glucose forecasting task. Obtained results are comparable to the standard MSE-based loss function, improving the results in the <italic>ParkesAB</italic> metric for 60-min PH respect to the MSE. Further tuning of <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM42"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> could improve the prediction metric by leading to a more aggressive penalization to the clinically critical errors in glucose prediction. Thus, higher <italic>ParkesAB</italic> and <italic>ISOZone</italic> values could be achieved, potentially outperforming the MSE loss function in the most clinically critical situations of glucose forecasting task. Furthermore, the design of <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM43"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> could have a higher influence on the most vulnerable subjects, i.e., the ones with more hypo- and hyper-glycemic episodes, since it penalizes more the errors for these critical ranges. In this work, no direct relations between prediction performance and the occurrence such episodes were observed (see <xref ref-type="sec" rid="s11">Supplementary Figure S9</xref>; <xref ref-type="fig" rid="F4">Figures&#x00A0;4</xref>, <xref ref-type="fig" rid="F5">5</xref>).</p>
<p>The inter-subject variability and the dependence of the prediction performance with the available CGM training samples have also been assessed in this work. This is also innovative regarding DL glucose prediction models evaluation. With the proposed LSTM-based and Dil-UNet architectures, no single model has shown optimal prediction performance for all subjects and no statistically significant differences were found between the three architectures. However, in general, the three models showed their best and worst prediction performance with the same subjects regardless of the available training samples. Nonetheless, the comparison of the na&#x00EF;ve approach with the proposed architectures allowed to establish a preliminary threshold for both PHs below which was not feasible to generate a reliable personalized DL model. This suggests that inter-subject variability was the main limiting factor to achieve more accurate prediction average results. More complex models specifically designed for time series forecasting, such as N-BEATS (<xref ref-type="bibr" rid="B54">54</xref>), or TSMixer (<xref ref-type="bibr" rid="B55">55</xref>) could deal with the impact of this phenomena, but it will not remove it.</p>
<p>In this work, it was decided not to include interpolation to deal with the missing data produced by CGM reading interruptions in the training, validation or test sets to assess the model analysis only on real data. Hence, unlike other DL-based approaches to predict glucose concentrations that implemented various types of interpolation when there was a reading interruption within 30&#x2005;min or 1&#x2005;h (<xref ref-type="bibr" rid="B24">24</xref>&#x2013;<xref ref-type="bibr" rid="B26">26</xref>, <xref ref-type="bibr" rid="B40">40</xref>), the dataset size was significantly decreased in some subjects that contained a considerable number of CGM reading interruptions. The impact of the interpolation can be studied in further work, since the personalized DL-models, especially in those subjects with a number of samples near the threshold, could benefit from a larger number of training and validation samples. Furthermore, in non-personalized models (i.e., that are trained with data from more than one subject), lack of data from one subject can be compensated by others that contribute with more instances. Here, in this work, sensor misfunction or disconnection will lead to the impossibility of a reliable DL model generation.</p>
<p>The DIY module that encapsulates the personalized DL-models was designed considering the daily habits of people with T1D, enhancing personalization and including a subject-oriented models training and evaluation. This was performed supported by a co-creation process through the arrangement of focus groups where potential users of this module offered feedback regarding their needs and preferences of this module. The idea underlying this design was the users&#x0027; engagement through their empowerment regarding the relationship between AI and their data (<xref ref-type="bibr" rid="B30">30</xref>), for example by providing them with information about why their models could (or could not) be generated. Furthermore, it is the user who decides when to be prompted with a glucose prediction or with additional information, thus avoiding the overwhelmingness associated with excessive and non-required information. Its modular design and containerization also facilitate its integration in other applications. However, its integration in smartphone OSs (namely, Android or iOS) is part of future work, to potentially reaching broader populations. In fact, this module is expected to be fully or partly integrated in the WARIFA application (<xref ref-type="bibr" rid="B31">31</xref>), as a result of a European project that has designed an application to prevent and manage diverse chronic conditions. As demonstrated in this work, this module is ready to be used standalone in Windows and Ubuntu, as it is already functional and publicly available (see Code Availability). Hence, this DIY module has the potential to have an immediate and positive impact on people who suffer from T1D, although there is more research work to do regarding DL model generation to reach better prediction performance for longer PHs. Additionally, being open source and exhaustively documented, AI researchers and developers could test novel DL architectures that could offer more accurate glucose predictions, use this DIY framework with data from different sensors from the ones employed in this work, integrate this module in an existent application, or enhance the module design from the usability perspective.</p>
<p>Although the DIY paradigm has been validated for T1D, its implementation can extend to other types of diabetes that are using CGM, such as type 2 diabetes (<xref ref-type="bibr" rid="B56">56</xref>). Besides, this methodology and the tool itself could be adapted and used for people with different chronic conditions that require continuous monitoring of body signals, and where a computer-aided system can be helpful for clinicians and individuals, such as cardiovascular diseases monitored with wearables devices (<xref ref-type="bibr" rid="B57">57</xref>).</p>
<p>Several future opportunities open up after the realization of this work. Firstly, the inclusion of diabetes-related input variables for the DL models, such as insulin, physical activity and carbohydrates intake, that would likely improve prediction performance (<xref ref-type="bibr" rid="B44">44</xref>). In this line, the framework might be adapted to generate DL models with less CGM data [e.g., 2 weeks, like the OhioT1DM dataset (<xref ref-type="bibr" rid="B53">53</xref>)]. Reducing the monitoring time would likely facilitate the presence of additional diabetes-related variables (e.g., carbohydrate intake, or insulin administration). Additionally, this would allow for easier comparison with other state-of-the-art methods. Related to this, the development of DL architectures that could provide reliable 60-min (and beyond) forecasting should be explored, aiming to increase the positive impact that this tool might have on people&#x0027;s glycemic control. Besides, experiments on parameter tuning of <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM44"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> loss function could be carried out. Obtained results suggest that architectures with more parameters can follow the <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM45"><mml:msub><mml:mi>L</mml:mi><mml:mrow><mml:mi>I</mml:mi><mml:mi>S</mml:mi><mml:mi>O</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> penalizations better, but they should be exhaustively studied. Regarding input data, apart from the inclusion of the abovementioned information, prediction performance could significantly benefit from the inclusion of other heterogeneous data, such as glycemic biomarkers, data from electronic health records, etc. Even though these are not real time acquired data, the data fusion paradigm could be explored to evaluate their impact on this task (<xref ref-type="bibr" rid="B58">58</xref>). Finally, messages prompted by the DIY module are currently static and equal for all users. However, the potential of the generative AI to personalize not only the CGM prediction, but also the feedback messages provided by this tool, suggest that its implementation on this module will likely increase user&#x0027;s engagement, enhancing our subject-oriented approach (<xref ref-type="bibr" rid="B59">59</xref>).</p>
<p>Moreover, if this module is used extensively and constantly over time, model maintenance strategy is a field to be explored, since DL models can lose performance with time (<xref ref-type="bibr" rid="B60">60</xref>). Strategies such as transfer learning (<xref ref-type="bibr" rid="B47">47</xref>), to re-train the models with new subject&#x0027;s data, or federated learning (<xref ref-type="bibr" rid="B61">61</xref>), to employ data from different subjects in the personalized models and to intend a distributed computation of such models, should be studied.</p>
<p>Finally, a pilot study should be carried out to evaluate the real impact of the AI-based DIY module on the daily life of people with T1D. A clinical study also could help to know if this module, as a computer-aid device for the users, will help people to increase their TIR, i.e., to have their glucose concentrations in a healthy range.</p>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability"><title>Data availability statement</title>
<p>The original contributions presented in the study are publicly available. The code underlying this research can be found here: <ext-link ext-link-type="uri" xlink:href="https://github.com/antorguez95/Personalized-AI-Based-Do-It-Yourself-Glucose-Prediction-tool">https://github.com/antorguez95/Personalized-AI-Based-Do-It-Yourself-Glucose-Prediction-tool</ext-link>.</p>
</sec>
<sec id="s6" sec-type="ethics-statement"><title>Ethics statement</title>
<p>Written informed consent was obtained from the individual(s) for the publication of any potentially identifiable images or data included in this article.</p>
</sec>
<sec id="s7" sec-type="author-contributions"><title>Author contributions</title>
<p>AR: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing, Conceptualization, Data curation, Investigation, Software. GS: Writing &#x2013; review &#x0026; editing, Conceptualization, Investigation. CB: Writing &#x2013; review &#x0026; editing, Data curation, Visualization. GZ: Writing &#x2013; review &#x0026; editing, Conceptualization, Investigation, Visualization. AD: Writing &#x2013; review &#x0026; editing, Visualization. M&#x00C1;: Writing &#x2013; review &#x0026; editing, Investigation, Visualization. E&#x00C5;: Writing &#x2013; review &#x0026; editing, Funding acquisition. CS: Writing &#x2013; review &#x0026; editing, Funding acquisition. AW: Writing &#x2013; review &#x0026; editing, Funding acquisition. CG: Writing &#x2013; review &#x0026; editing, Funding acquisition. GC: Writing &#x2013; review &#x0026; editing, Funding acquisition, Supervision, Resources. HF: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing, Conceptualization, Investigation, Funding acquisition, Supervision.</p>
</sec>
<sec id="s8" sec-type="funding-information"><title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This project has received funding from the European Union's Horizon 2020 research and innovation programme under grant agreement No 101017385. Additionally, this work was completed while Antonio Rodr&#x00ED;guez was beneficiary of a pre-doctoral grant given by the &#x201C;Agencia Canaria de Investigaci&#x00F3;n, Innovaci&#x00F3;n y Sociedad de la Informaci&#x00F3;n (ACIISI)&#x201D; of the &#x201C;Consejer&#x00ED;a de Econom&#x00ED;a, Conocimiento y Empleo&#x201D; of the &#x201C;Gobierno de Canarias&#x201D;, which is part-financed by the European Social Fund (FSE) (POC 2014-2020, Eje 3 Tema Prioritario 74 (85 &#x0025;)).</p>
</sec>
<ack><title>Acknowledgments</title>
<p>The authors want to thank Abi&#x00E1;n Hernandez Guedes for sharing part of his vast knowledge about Deep Learning, enriching the assessment of the CGM forecast problem. Besides, they also want to thank Raquel Leon and Laura Quintana Quintana for their always valuable and clarifying points of view, improving the visualization of this tool. Finally, thank the participants who donated their data and any clinicians inviting people and who do not qualify as co-authors.</p>
</ack>
<sec id="s9" sec-type="COI-statement"><title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="ai-statement"><title>Generative AI statement</title>
<p>The authors declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec id="s12" sec-type="disclaimer"><title>Publisher&#x0027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material"><title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fdgth.2025.1534830/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fdgth.2025.1534830/full&#x0023;supplementary-material</ext-link></p>
<supplementary-material id="SD1" content-type="local-data">
<media mimetype="application" mime-subtype="pdf" xlink:href="Datasheet1.pdf"/></supplementary-material>
</sec>
<ref-list><title>References</title>
<ref id="B1"><label>1.</label><citation citation-type="book"><collab>IDF Diabetes Atlas 10th Edition Scientific Committee</collab>. <source>IDF Diabetes Atlas</source>. <publisher-loc>Brussels</publisher-loc>: <publisher-name>International Diabetes Federation</publisher-name> (<year>2021</year>).</citation></ref>
<ref id="B2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mackenzie</surname><given-names>SC</given-names></name><name><surname>Sainsbury</surname><given-names>CAR</given-names></name><name><surname>Wake</surname><given-names>DJ</given-names></name></person-group>. <article-title>Diabetes and artificial intelligence beyond the closed loop: a review of the landscape, promise and challenges</article-title>. <source>Diabetologia</source>. (<year>2023</year>) <volume>67</volume>:<fpage>223</fpage>&#x2013;<lpage>35</lpage>. <pub-id pub-id-type="doi">10.1007/s00125-023-06038-8</pub-id><pub-id pub-id-type="pmid">37979006</pub-id></citation></ref>
<ref id="B3"><label>3.</label><citation citation-type="other"><article-title>World Health Organization. Diabetes</article-title> (<year>2024</year>). <comment>Available at:</comment> <ext-link ext-link-type="uri" xlink:href="https://www.who.int/news-room/fact-sheets/detail/diabetes">https://www.who.int/news-room/fact-sheets/detail/diabetes</ext-link> <comment>(Accessed January 18, 2024)</comment>.</citation></ref>
<ref id="B4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Deshpande</surname><given-names>AD</given-names></name><name><surname>Harris-Hayes</surname><given-names>M</given-names></name><name><surname>Schootman</surname><given-names>M</given-names></name></person-group>. <article-title>Epidemiology of diabetes and diabetes-related complications</article-title>. <source>Phys Ther</source>. (<year>2008</year>) <volume>88</volume>(<issue>11</issue>):<fpage>1254</fpage>&#x2013;<lpage>64</lpage>. <pub-id pub-id-type="doi">10.2522/ptj.20080020</pub-id><pub-id pub-id-type="pmid">18801858</pub-id></citation></ref>
<ref id="B5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Atkinson</surname><given-names>MA</given-names></name><name><surname>Eisenbarth</surname><given-names>GS</given-names></name><name><surname>Michels</surname><given-names>AW</given-names></name></person-group>. <article-title>Type 1 diabetes</article-title>. <source>Lancet</source>. (<year>2014</year>) <volume>383</volume>:<fpage>69</fpage>&#x2013;<lpage>82</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(13)60591-7</pub-id><pub-id pub-id-type="pmid">23890997</pub-id></citation></ref>
<ref id="B6"><label>6.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McCrimmon</surname><given-names>RJ</given-names></name><name><surname>Sherwin</surname><given-names>RS</given-names></name></person-group>. <article-title>Hypoglycemia in type 1 diabetes</article-title>. <source>Diabetes</source>. (<year>2010</year>) <volume>59</volume>:<fpage>2333</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.2337/db10-0103</pub-id><pub-id pub-id-type="pmid">20876723</pub-id></citation></ref>
<ref id="B7"><label>7.</label><citation citation-type="journal"><collab>Diabetes Control and Complications Trial Research Group</collab>. <article-title>Effect of intensive diabetes treatment on the development and progression of long-term complications in adolescents with insulin-dependent diabetes mellitus: diabetes control and complications trial</article-title>. <source>J Pediatr</source>. (<year>1994</year>) <volume>125</volume>(<issue>2</issue>):<fpage>177</fpage>&#x2013;<lpage>88</lpage>. <pub-id pub-id-type="doi">10.1016/S0022-3476(94)70190-3</pub-id><pub-id pub-id-type="pmid">8040759</pub-id></citation></ref>
<ref id="B8"><label>8.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vettoretti</surname><given-names>M</given-names></name><name><surname>Cappon</surname><given-names>G</given-names></name><name><surname>Acciaroli</surname><given-names>G</given-names></name><name><surname>Facchinetti</surname><given-names>A</given-names></name><name><surname>Sparacino</surname><given-names>G</given-names></name></person-group>. <article-title>Continuous glucose monitoring: current use in diabetes management and possible future applications</article-title>. <source>J Diabetes Sci Technol</source>. (<year>2018</year>) <volume>12</volume>(<issue>5</issue>):<fpage>1064</fpage>&#x2013;<lpage>71</lpage>. <pub-id pub-id-type="doi">10.1177/1932296818774078</pub-id><pub-id pub-id-type="pmid">29783897</pub-id></citation></ref>
<ref id="B9"><label>9.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Perkins</surname><given-names>BA</given-names></name><name><surname>Sherr</surname><given-names>JL</given-names></name><name><surname>Mathieu</surname><given-names>C</given-names></name></person-group>. <article-title>Type 1 diabetes glycemic management: insulin therapy, glucose monitoring, and automation</article-title>. <source>Science</source>. (<year>2021</year>) <volume>373</volume>. <pub-id pub-id-type="doi">10.1126/science.abg4502</pub-id><pub-id pub-id-type="pmid">34326234</pub-id></citation></ref>
<ref id="B10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Battelino</surname><given-names>T</given-names></name><name><surname>Danne</surname><given-names>T</given-names></name><name><surname>Bergenstal</surname><given-names>RM</given-names></name><name><surname>Amiel</surname><given-names>SA</given-names></name><name><surname>Beck</surname><given-names>R</given-names></name><name><surname>Biester</surname><given-names>T</given-names></name><etal/></person-group> <article-title>Clinical targets for continuous glucose monitoring data interpretation: recommendations from the international consensus on time in range</article-title>. <source>Diabetes Care</source>. (<year>2019</year>) <volume>42</volume>(<issue>8</issue>):<fpage>1593</fpage>&#x2013;<lpage>603</lpage>. <pub-id pub-id-type="doi">10.2337/dci19-0028</pub-id><pub-id pub-id-type="pmid">31177185</pub-id></citation></ref>
<ref id="B11"><label>11.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tamborlane</surname><given-names>WV</given-names></name><name><surname>Beck</surname><given-names>RW</given-names></name><name><surname>Bode</surname><given-names>BW</given-names></name><name><surname>Buckingham</surname><given-names>B</given-names></name><name><surname>Chase</surname><given-names>HP</given-names></name><name><surname>Clemons</surname><given-names>R</given-names></name><etal/></person-group> <article-title>Continuous glucose monitoring and intensive treatment of type 1 diabetes</article-title>. <source>N Engl J Med</source>. (<year>2008</year>) <volume>359</volume>(<issue>14</issue>):<fpage>1464</fpage>&#x2013;<lpage>76</lpage>. <pub-id pub-id-type="doi">10.1056/NEJMoa0805017</pub-id><pub-id pub-id-type="pmid">18779236</pub-id></citation></ref>
<ref id="B12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hamine</surname><given-names>S</given-names></name><name><surname>Gerth-Guyette</surname><given-names>E</given-names></name><name><surname>Faulx</surname><given-names>D</given-names></name><name><surname>Green</surname><given-names>BB</given-names></name><name><surname>Ginsburg</surname><given-names>AS</given-names></name></person-group>. <article-title>Impact of mHealth chronic disease management on treatment adherence and patient outcomes: a systematic review</article-title>. <source>J Med Internet Res</source>. (<year>2015</year>) <volume>17</volume>:<fpage>e3951</fpage>. <pub-id pub-id-type="doi">10.2196/jmir.3951</pub-id></citation></ref>
<ref id="B13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Agnihothri</surname><given-names>S</given-names></name><name><surname>Cui</surname><given-names>L</given-names></name><name><surname>Delasay</surname><given-names>M</given-names></name><name><surname>Rajan</surname><given-names>B</given-names></name></person-group>. <article-title>The value of mHealth for managing chronic conditions</article-title>. <source>Health Care Manag Sci</source>. (<year>2020</year>) <volume>23</volume>(<issue>2</issue>):<fpage>185</fpage>&#x2013;<lpage>202</lpage>. <pub-id pub-id-type="doi">10.1007/s10729-018-9458-2</pub-id><pub-id pub-id-type="pmid">30382448</pub-id></citation></ref>
<ref id="B14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname><given-names>JM</given-names></name><name><surname>Newman</surname><given-names>MW</given-names></name><name><surname>Gebremariam</surname><given-names>A</given-names></name><name><surname>Choi</surname><given-names>P</given-names></name><name><surname>Lewis</surname><given-names>D</given-names></name><name><surname>Nordgren</surname><given-names>W</given-names></name><etal/></person-group> <article-title>Real-world use and self-reported health outcomes of a patient-designed do-it-yourself mobile technology system for diabetes: lessons for mobile health</article-title>. <source>Diabetes Technol Ther</source>. (<year>2017</year>) <volume>19</volume>(<issue>4</issue>):<fpage>209</fpage>&#x2013;<lpage>19</lpage>. <pub-id pub-id-type="doi">10.1089/dia.2016.0312</pub-id><pub-id pub-id-type="pmid">28245152</pub-id></citation></ref>
<ref id="B15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morrison</surname><given-names>AE</given-names></name><name><surname>Chong</surname><given-names>K</given-names></name><name><surname>Senior</surname><given-names>PA</given-names></name><name><surname>Lam</surname><given-names>A</given-names></name></person-group>. <article-title>A scoping review of do-it-yourself automated insulin delivery system (DIY AID) use in people with type 1 diabetes</article-title>. <source>PLoS One</source>. (<year>2022</year>) <volume>17</volume>(<issue>8</issue>):<fpage>e0271096</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0271096</pub-id><pub-id pub-id-type="pmid">35951597</pub-id></citation></ref>
<ref id="B16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname><given-names>JM</given-names></name><name><surname>Hirschfeld</surname><given-names>E</given-names></name><name><surname>Wedding</surname><given-names>J</given-names></name></person-group>. <article-title>A patient-designed do-it-yourself mobile technology system for diabetes: promise and challenges for a new era in medicine</article-title>. <source>JAMA</source>. (<year>2016</year>) <volume>315</volume>:<fpage>1447</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1001/jama.2016.1903</pub-id><pub-id pub-id-type="pmid">27115262</pub-id></citation></ref>
<ref id="B17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Deniz-Garcia</surname><given-names>A</given-names></name><name><surname>Fabelo</surname><given-names>H</given-names></name><name><surname>Rodriguez-Almeida</surname><given-names>AJ</given-names></name><name><surname>Zamora-Zamorano</surname><given-names>G</given-names></name><name><surname>Castro-Fernandez</surname><given-names>M</given-names></name><name><surname>del Pino Alberiche Ruano</surname><given-names>M</given-names></name><etal/></person-group> <article-title>Quality, usability, and effectiveness of mHealth apps and the role of artificial intelligence: current scenario and challenges</article-title>. <source>J Med Internet Res</source>. (<year>2023</year>) <volume>25</volume>(<issue>1</issue>):<fpage>e44030</fpage>. <pub-id pub-id-type="doi">10.2196/44030</pub-id><pub-id pub-id-type="pmid">37140973</pub-id></citation></ref>
<ref id="B18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lum</surname><given-names>JW</given-names></name><name><surname>Bailey</surname><given-names>RJ</given-names></name><name><surname>Barnes-Lomen</surname><given-names>V</given-names></name><name><surname>Naranjo</surname><given-names>D</given-names></name><name><surname>Hood</surname><given-names>KK</given-names></name><name><surname>Lal</surname><given-names>RA</given-names></name><etal/></person-group> <article-title>A real-world prospective study of the safety and effectiveness of the loop open source automated insulin delivery system</article-title>. <source>Diabetes Technol Ther</source>. (<year>2021</year>) <volume>23</volume>(<issue>5</issue>):<fpage>367</fpage>&#x2013;<lpage>75</lpage>. <pub-id pub-id-type="doi">10.1089/dia.2020.0535</pub-id><pub-id pub-id-type="pmid">33226840</pub-id></citation></ref>
<ref id="B19"><label>19.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>X</given-names></name><name><surname>Shu</surname><given-names>W</given-names></name><name><surname>Du</surname><given-names>J</given-names></name><name><surname>Du</surname><given-names>M</given-names></name><name><surname>Wang</surname><given-names>P</given-names></name><name><surname>Xue</surname><given-names>M</given-names></name><etal/></person-group> <article-title>Mobile health in the management of type 1 diabetes: a systematic review and meta-analysis</article-title>. <source>BMC Endocr Disord</source>. (<year>2019</year>) <volume>19</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1186/s12902-019-0347-6</pub-id><pub-id pub-id-type="pmid">30606164</pub-id></citation></ref>
<ref id="B20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Revert</surname><given-names>A</given-names></name><name><surname>Garelli</surname><given-names>F</given-names></name><name><surname>Pico</surname><given-names>J</given-names></name><name><surname>De Battista</surname><given-names>H</given-names></name><name><surname>Rossetti</surname><given-names>P</given-names></name><name><surname>Vehi</surname><given-names>J</given-names></name><etal/></person-group> <article-title>Safety auxiliary feedback element for the artificial pancreas in type 1 diabetes</article-title>. <source>IEEE Trans Biomed Eng</source>. (<year>2013</year>) <volume>60</volume>(<issue>8</issue>):<fpage>2113</fpage>&#x2013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.1109/TBME.2013.2247602</pub-id><pub-id pub-id-type="pmid">23428611</pub-id></citation></ref>
<ref id="B21"><label>21.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bequette</surname><given-names>BW</given-names></name></person-group>. <article-title>Challenges and recent progress in the development of a closed-loop artificial pancreas</article-title>. <source>Annu Rev Control</source>. (<year>2012</year>) <volume>36</volume>(<issue>2</issue>):<fpage>255</fpage>&#x2013;<lpage>66</lpage>. <pub-id pub-id-type="doi">10.1016/j.arcontrol.2012.09.007</pub-id><pub-id pub-id-type="pmid">23175620</pub-id></citation></ref>
<ref id="B22"><label>22.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>De Bois</surname><given-names>M</given-names></name><name><surname>Yacoubi</surname><given-names>MAE</given-names></name><name><surname>Ammi</surname><given-names>M</given-names></name></person-group>. <article-title>GLYFE: review and benchmark of personalized glucose predictive models in type 1 diabetes</article-title>. <source>Med Biol Eng Comput</source>. (<year>2022</year>) <volume>60</volume>:<fpage>1</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1007/s11517-021-02437-4</pub-id><pub-id pub-id-type="pmid">34751904</pub-id></citation></ref>
<ref id="B23"><label>23.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Bunescu</surname><given-names>R</given-names></name><name><surname>Struble</surname><given-names>N</given-names></name><name><surname>Marling</surname><given-names>C</given-names></name><name><surname>Shubrook</surname><given-names>J</given-names></name><name><surname>Schwartz</surname><given-names>F</given-names></name></person-group>. <article-title>Blood glucose level prediction using physiological models and support vector regression</article-title>. In: <conf-name>Proceedings&#x2014;2013 12th International Conference on Machine Learning and Applications, ICMLA 2013</conf-name>; <publisher-name>IEEE Computer Society</publisher-name> (<year>2013</year>). p. <fpage>135</fpage>&#x2013;<lpage>40</lpage>.</citation></ref>
<ref id="B24"><label>24.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zaidi</surname><given-names>SMA</given-names></name><name><surname>Chandola</surname><given-names>V</given-names></name><name><surname>Ibrahim</surname><given-names>M</given-names></name><name><surname>Romanski</surname><given-names>B</given-names></name><name><surname>Mastrandrea</surname><given-names>LD</given-names></name><name><surname>Singh</surname><given-names>T</given-names></name></person-group>. <article-title>Multi-step ahead predictive model for blood glucose concentrations of type-1 diabetic patients</article-title>. <source>Sci Rep</source>. (<year>2021</year>) <volume>11</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1038/s41598-021-03341-5</pub-id><pub-id pub-id-type="pmid">33414495</pub-id></citation></ref>
<ref id="B25"><label>25.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>K</given-names></name><name><surname>Liu</surname><given-names>C</given-names></name><name><surname>Zhu</surname><given-names>T</given-names></name><name><surname>Herrero</surname><given-names>P</given-names></name><name><surname>Georgiou</surname><given-names>P</given-names></name></person-group>. <article-title>Glunet: a deep learning framework for accurate glucose forecasting</article-title>. <source>IEEE J Biomed Health Inform</source>. (<year>2020</year>) <volume>24</volume>(<issue>2</issue>):<fpage>414</fpage>&#x2013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.1109/JBHI.2019.2931842</pub-id><pub-id pub-id-type="pmid">31369390</pub-id></citation></ref>
<ref id="B26"><label>26.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mosquera-Lopez</surname><given-names>C</given-names></name><name><surname>Jacobs</surname><given-names>PG</given-names></name></person-group>. <article-title>Incorporating glucose variability into glucose forecasting accuracy assessment using the new glucose variability impact Index and the prediction consistency Index: an LSTM case example</article-title>. <source>J Diabetes Sci Technol</source>. (<year>2022</year>) <volume>16</volume>(<issue>1</issue>):<fpage>7</fpage>&#x2013;<lpage>18</lpage>. <pub-id pub-id-type="doi">10.1177/19322968211042621</pub-id><pub-id pub-id-type="pmid">34490793</pub-id></citation></ref>
<ref id="B27"><label>27.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fatehi</surname><given-names>F</given-names></name><name><surname>Menon</surname><given-names>A</given-names></name><name><surname>Bird</surname><given-names>D</given-names></name></person-group>. <article-title>Diabetes care in the digital era: a synoptic overview</article-title>. <source>Curr Diab Rep</source>. (<year>2018</year>) <volume>18</volume>(<issue>7</issue>):<fpage>1</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1007/s11892-018-1013-5</pub-id><pub-id pub-id-type="pmid">29362940</pub-id></citation></ref>
<ref id="B28"><label>28.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nurgalieva</surname><given-names>L</given-names></name><name><surname>O&#x2019;Callaghan</surname><given-names>D</given-names></name><name><surname>Doherty</surname><given-names>G</given-names></name></person-group>. <article-title>Security and privacy of mHealth applications: a scoping review</article-title>. <source>IEEE Access</source>. (<year>2020</year>) <volume>8</volume>:<fpage>104247</fpage>&#x2013;<lpage>68</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2020.2999934</pub-id></citation></ref>
<ref id="B29"><label>29.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Atienza</surname><given-names>AA</given-names></name><name><surname>Zarcadoolas</surname><given-names>C</given-names></name><name><surname>Vaughon</surname><given-names>W</given-names></name><name><surname>Hughes</surname><given-names>P</given-names></name><name><surname>Patel</surname><given-names>V</given-names></name><name><surname>Chou</surname><given-names>WYS</given-names></name><etal/></person-group> <article-title>Consumer attitudes and perceptions on mhealth privacy and security: findings from a mixed-methods study</article-title>. <source>J Health Commun</source>. (<year>2015</year>) <volume>20</volume>(<issue>6</issue>):<fpage>673</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1080/10810730.2015.1018560</pub-id><pub-id pub-id-type="pmid">25868685</pub-id></citation></ref>
<ref id="B30"><label>30.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>Reis</surname><given-names>T</given-names></name><name><surname>Bruchhaus</surname><given-names>S</given-names></name><name><surname>Vu</surname><given-names>B</given-names></name><name><surname>Bornschlegl</surname><given-names>MX</given-names></name><name><surname>Hemmje</surname><given-names>ML</given-names></name></person-group>. <article-title>Towards modeling AI-based user empowerment for visual big data analysis</article-title>. In: Frommholz I, Liu H, Melucci M, Belkin NJ, Jones GJF, Kando N, et al., editors. <source>Joint Proceedings of the Second Workshop on Bridging the Gap Between Information Science, Information Retrieval and Data Science, and Third Workshop on Evaluation of Personalisation in Information Retrieval, Co-Located with 6th ACM SIGIR Conference on Human Information Interaction and Retrieval (CHIIR 2021); 2021 Mar 19; Canberra, Australia (Virtual Event)</source>. CEUR Workshop Proceedings. Vol. 2863. (2021). p. <fpage>67</fpage>&#x2013;<lpage>75</lpage>. Available at: <ext-link ext-link-type="uri" xlink:href="https://ceur-ws.org/Vol-2863/paper-07.pdf">https://ceur-ws.org/Vol-2863/paper-07.pdf</ext-link></citation></ref>
<ref id="B31"><label>31.</label><citation citation-type="other"><collab>WARIFA Consortium</collab>. <article-title>Warifa</article-title> (<year>2021</year>). <comment>Available at:</comment> <ext-link ext-link-type="uri" xlink:href="https://www.warifa.eu/">https://www.warifa.eu/</ext-link> <comment>(Accessed April 16, 2023)</comment>.</citation></ref>
<ref id="B32"><label>32.</label><citation citation-type="book"><collab>International Organization for Standardization</collab>. <source>ISO 15197:2013. In Vitro Diagnostic Test Systems &#x2013; Requirements for Blood-Glucose Monitoring Systems for Self-Testing in Managing Diabetes Mellitus</source>. <publisher-loc>Geneva</publisher-loc>: <publisher-name>ISO</publisher-name> (<year>2015</year>).</citation></ref>
<ref id="B33"><label>33.</label><citation citation-type="other"><article-title>Python Release Python 3.10.13&#x007C;Python.org</article-title> (<year>2024</year>). <comment>Available at:</comment> <ext-link ext-link-type="uri" xlink:href="https://www.python.org/downloads/release/python-31013/">https://www.python.org/downloads/release/python-31013/</ext-link> <comment>(Accessed January 24, 2024)</comment>.</citation></ref>
<ref id="B34"><label>34.</label><citation citation-type="other"><article-title>TensorFlow. API documentation: TensorFlow v2.10.1. Google (2022)</article-title>. <comment>Available at</comment>: <ext-link ext-link-type="uri" xlink:href="https://www.tensorflow.org/versions/r2.10/api_docs">https://www.tensorflow.org/versions/r2.10/api_docs</ext-link> <comment>(Accessed January 24, 2024)</comment>.</citation></ref>
<ref id="B35"><label>35.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sutskever</surname><given-names>I</given-names></name><name><surname>Vinyals</surname><given-names>O</given-names></name><name><surname>Le</surname><given-names>QV</given-names></name></person-group>. <article-title>Sequence to sequence learning with neural networks</article-title>. <source>Adv Neural Inf Process Syst</source>. (<year>2014</year>) <volume>4</volume>:<fpage>3104</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.48550/arXiv.1409.3215</pub-id></citation></ref>
<ref id="B36"><label>36.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Du</surname><given-names>X</given-names></name><name><surname>Zhang</surname><given-names>H</given-names></name><name><surname>Van Nguyen</surname><given-names>H</given-names></name><name><surname>Han</surname><given-names>Z</given-names></name></person-group>. <article-title>Stacked LSTM deep learning model for traffic prediction in vehicle-to-vehicle communication</article-title>. In: <source>Proceedings of the 86th IEEE Vehicular Technology Conference (VTC-Fall); 2017 Sep 24&#x2013;27; Toronto, ON, Canada</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name> (<year>2017</year>). p. <fpage>1</fpage>&#x2013;<lpage>5</lpage>.</citation></ref>
<ref id="B37"><label>37.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van Cauter</surname><given-names>E</given-names></name><name><surname>Polonsky</surname><given-names>KS</given-names></name><name><surname>Scheen</surname><given-names>AJ</given-names></name></person-group>. <article-title>Roles of circadian rhythmicity and sleep in human glucose regulation&#x002A;</article-title>. <source>Endocr Rev</source>. (<year>1997</year>) <volume>18</volume>(<issue>5</issue>):<fpage>716</fpage>&#x2013;<lpage>38</lpage>. <pub-id pub-id-type="doi">10.1210/edrv.18.5.0317</pub-id><pub-id pub-id-type="pmid">9331550</pub-id></citation></ref>
<ref id="B38"><label>38.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>Z</given-names></name><name><surname>Liu</surname><given-names>F</given-names></name><name><surname>Yang</surname><given-names>W</given-names></name><name><surname>Peng</surname><given-names>S</given-names></name><name><surname>Zhou</surname><given-names>J</given-names></name></person-group>. <article-title>A survey of convolutional neural networks: analysis, applications, and prospects</article-title>. <source>IEEE Trans Neural Netw Learn Syst</source>. (<year>2022</year>) <volume>33</volume>(<issue>12</issue>):<fpage>6999</fpage>&#x2013;<lpage>7019</lpage>. <pub-id pub-id-type="doi">10.1109/TNNLS.2021.3084827</pub-id><pub-id pub-id-type="pmid">34111009</pub-id></citation></ref>
<ref id="B39"><label>39.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hochreiter</surname><given-names>S</given-names></name><name><surname>Schmidhuber</surname><given-names>J</given-names></name></person-group>. <article-title>Long short-term memory</article-title>. <source>Neural Comput</source>. (<year>1997</year>) <volume>9</volume>(<issue>8</issue>):<fpage>1735</fpage>&#x2013;<lpage>80</lpage>. <pub-id pub-id-type="doi">10.1162/neco.1997.9.8.1735</pub-id><pub-id pub-id-type="pmid">9377276</pub-id></citation></ref>
<ref id="B40"><label>40.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>De Paoli</surname><given-names>B</given-names></name><name><surname>D&#x2019;Antoni</surname><given-names>F</given-names></name><name><surname>Merone</surname><given-names>M</given-names></name><name><surname>Pieralice</surname><given-names>S</given-names></name><name><surname>Piemonte</surname><given-names>V</given-names></name><name><surname>Pozzilli</surname><given-names>P.</given-names></name></person-group> <article-title>Blood glucose level forecasting on type-1-diabetes subjects during physical activity: a comparative analysis of different learning techniques</article-title>. <source>Bioengineering</source>. (<year>2021</year>) <volume>8</volume>(<issue>6</issue>):<fpage>72</fpage>. <pub-id pub-id-type="doi">10.3390/bioengineering8060072</pub-id><pub-id pub-id-type="pmid">34073433</pub-id></citation></ref>
<ref id="B41"><label>41.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baldi</surname><given-names>P</given-names></name><name><surname>Sadowski</surname><given-names>P</given-names></name></person-group>. <article-title>Understanding dropout</article-title>. <source>Adv Neural Inf Process Syst</source>. (<year>2013</year>) <volume>26</volume>:<fpage>2814</fpage>&#x2013;<lpage>22</lpage>.</citation></ref>
<ref id="B42"><label>42.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hawkins</surname><given-names>DM</given-names></name></person-group>. <article-title>The problem of overfitting</article-title>. <source>J Chem Inf Comput Sci</source>. (<year>2004</year>) <volume>44</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1021/ci0342472</pub-id><pub-id pub-id-type="pmid">14741005</pub-id></citation></ref>
<ref id="B43"><label>43.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Renna</surname><given-names>F</given-names></name><name><surname>Oliveira</surname><given-names>J</given-names></name><name><surname>Coimbra</surname><given-names>MT</given-names></name></person-group>. <article-title>Deep convolutional neural networks for heart sound segmentation</article-title>. <source>IEEE J Biomed Health Inform</source>. (<year>2019</year>) <volume>23</volume>(<issue>6</issue>):<fpage>2435</fpage>&#x2013;<lpage>45</lpage>. <pub-id pub-id-type="doi">10.1109/JBHI.2019.2894222</pub-id><pub-id pub-id-type="pmid">30668487</pub-id></citation></ref>
<ref id="B44"><label>44.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Rubin-Falcone</surname><given-names>H</given-names></name><name><surname>Fox</surname><given-names>I</given-names></name><name><surname>Wiens</surname><given-names>J</given-names></name></person-group>. <article-title>Deep residual time-series forecasting: application to blood glucose prediction</article-title>. In: <source>Proceedings of the 5th International Workshop on Knowledge Discovery in Healthcare Data (KDH 2020) at ECAI; 2020 Sep 4; Santiago de Compostela, Spain</source>. CEUR Workshop Proceedings. Vol. 2675. <publisher-loc>Aachen</publisher-loc>: CEUR-WS.org (<year>2020</year>). p. <fpage>9</fpage>&#x2013;<lpage>16</lpage>.</citation></ref>
<ref id="B45"><label>45.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>C</given-names></name><name><surname>Veh&#x00ED;</surname><given-names>J</given-names></name><name><surname>Avari</surname><given-names>P</given-names></name><name><surname>Reddy</surname><given-names>M</given-names></name><name><surname>Oliver</surname><given-names>N</given-names></name><name><surname>Georgiou</surname><given-names>P</given-names></name><etal/></person-group> <article-title>Long-term glucose forecasting using a physiological model and deconvolution of the continuous glucose monitoring signal</article-title>. <source>Sensors</source>. (<year>2019</year>) <volume>19</volume>(<issue>19</issue>):<fpage>4338</fpage>. <pub-id pub-id-type="doi">10.3390/s19194338</pub-id><pub-id pub-id-type="pmid">31597288</pub-id></citation></ref>
<ref id="B46"><label>46.</label><citation citation-type="book"><collab>Docker Inc</collab>. <source>Docker: accelerated container application development</source>. <publisher-loc>San Francisco, CA</publisher-loc>: <publisher-name>Docker Inc</publisher-name>. (<year>2013</year>). <comment>Available at:</comment> <ext-link ext-link-type="uri" xlink:href="https://www.docker.com/">https://www.docker.com/</ext-link> <comment>(Accessed June 26, 2024)</comment>.</citation></ref>
<ref id="B47"><label>47.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Zhuang</surname><given-names>F</given-names></name><name><surname>Qi</surname><given-names>Z</given-names></name><name><surname>Duan</surname><given-names>K</given-names></name><name><surname>Xi</surname><given-names>D</given-names></name><name><surname>Zhu</surname><given-names>Y</given-names></name><name><surname>Zhu</surname><given-names>H</given-names></name><etal/></person-group> <article-title>A comprehensive survey on transfer learning</article-title>. <source>Proc IEEE</source>. (<year>2021</year>) <volume>109</volume>(<issue>1</issue>):<fpage>43</fpage>&#x2013;<lpage>76</lpage>. <pub-id pub-id-type="doi">10.1109/JPROC.2020.3004555</pub-id></citation></ref>
<ref id="B48"><label>48.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>El Idrissi</surname><given-names>T</given-names></name><name><surname>Idri</surname><given-names>A</given-names></name></person-group>. <article-title>Deep learning for blood glucose prediction: CNN vs. LSTM</article-title>. In: Gervasi O, Murgante B, Misra S, Garau C, Ble&#x010D;i&#x0107; I, Taniar D, et al., editors. <source>Computational Science and Its Applications &#x2013; ICCSA 2020</source>. Lecture Notes in Computer Science Vol. 12250. <publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2020</year>). p. <fpage>385</fpage>&#x2013;<lpage>400</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-030-58802-1_28</pub-id></citation></ref>
<ref id="B49"><label>49.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haus</surname><given-names>E</given-names></name></person-group>. <article-title>Chronobiology in the endocrine system</article-title>. <source>Adv Drug Deliv Rev</source>. (<year>2007</year>) <volume>59</volume>:<fpage>985</fpage>&#x2013;<lpage>1014</lpage><volume>.</volume> <pub-id pub-id-type="doi">10.1016/j.addr.2007.01.001</pub-id><pub-id pub-id-type="pmid">17804113</pub-id></citation></ref>
<ref id="B50"><label>50.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Moscoso-Vasquez</surname><given-names>M</given-names></name><name><surname>Colmegna</surname><given-names>P</given-names></name><name><surname>Sanchez-Pena</surname><given-names>RS</given-names></name></person-group>. <article-title>Intra-patient dynamic variations in type 1 diabetes: a review</article-title>. In: <conf-name>2016 IEEE Conference on Control Applications, CCA 2016</conf-name>. <publisher-name>Institute of Electrical and Electronics Engineers Inc.</publisher-name> (<year>2016</year>). p. <fpage>416</fpage>&#x2013;<lpage>21</lpage>.</citation></ref>
<ref id="B51"><label>51.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shilo</surname><given-names>S</given-names></name><name><surname>Keshet</surname><given-names>A</given-names></name><name><surname>Rossman</surname><given-names>H</given-names></name><name><surname>Godneva</surname><given-names>A</given-names></name><name><surname>Talmor-Barkan</surname><given-names>Y</given-names></name><name><surname>Aviv</surname><given-names>Y</given-names></name><etal/></person-group> <article-title>Continuous glucose monitoring and intrapersonal variability in fasting glucose</article-title>. <source>Nat Med</source>. (<year>2024</year>) <volume>30</volume>(<issue>5</issue>):<fpage>1424</fpage>&#x2013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-024-02908-9</pub-id><pub-id pub-id-type="pmid">38589602</pub-id></citation></ref>
<ref id="B52"><label>52.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>SCY</given-names></name><name><surname>Nickel</surname><given-names>G</given-names></name><name><surname>Venkatesh</surname><given-names>KP</given-names></name><name><surname>Raza</surname><given-names>MM</given-names></name><name><surname>Kvedar</surname><given-names>JC</given-names></name></person-group>. <article-title>AI-based diabetes care: risk prediction models and implementation concerns</article-title>. <source>NPJ Digit Med</source>. (<year>2024</year>) <volume>7</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>2</lpage>. <pub-id pub-id-type="doi">10.1038/s41746-024-01034-7</pub-id><pub-id pub-id-type="pmid">38172429</pub-id></citation></ref>
<ref id="B53"><label>53.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Marling</surname><given-names>C</given-names></name><name><surname>Bunescu</surname><given-names>R</given-names></name></person-group>. <article-title>The ohioT1DM dataset for blood glucose level prediction: update 2020</article-title>. In: <conf-name>CEUR Workshop Proceedings</conf-name>; <publisher-name>CEUR-WS</publisher-name> (<year>2020</year>). p. <fpage>71</fpage>&#x2013;<lpage>4</lpage>.</citation></ref>
<ref id="B54"><label>54.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Oreshkin</surname><given-names>BN</given-names></name><name><surname>Carpov</surname><given-names>D</given-names></name><name><surname>Chapados</surname><given-names>N</given-names></name><name><surname>Bengio</surname><given-names>Y</given-names></name></person-group>. <article-title>N-BEATS: neural basis expansion analysis for interpretable time series forecasting</article-title>. In: <conf-name>Proceedings of the 8th International Conference on Learning Representations (ICLR 2020); 2020 Apr 26&#x2013;30; Addis Ababa, Ethiopia</conf-name>. Published online. Available at: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1905.10437v4">https://arxiv.org/abs/1905.10437v4</ext-link></citation></ref>
<ref id="B55"><label>55.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>SA</given-names></name><name><surname>Li</surname><given-names>CL</given-names></name><name><surname>Yoder</surname><given-names>NC</given-names></name><name><surname>Cloud</surname><given-names>G</given-names></name><name><surname>Research</surname><given-names>AI</given-names></name><name><surname>Ar&#x0131;k</surname><given-names>S&#x00D6;</given-names></name><etal/></person-group> <article-title>TSMixer: an All-MLP architecture for time series forecasting</article-title> (<year>2023</year>). <comment>Available at:</comment> <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/2303.06053v5">https://arxiv.org/abs/2303.06053v5</ext-link> <comment>(Accessed June 26, 2024)</comment>.</citation></ref>
<ref id="B56"><label>56.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bergenstal</surname><given-names>RM</given-names></name><name><surname>Kerr</surname><given-names>MSD</given-names></name><name><surname>Roberts</surname><given-names>GJ</given-names></name><name><surname>Souto</surname><given-names>D</given-names></name><name><surname>Nabutovsky</surname><given-names>Y</given-names></name><name><surname>Hirsch</surname><given-names>IB</given-names></name></person-group>. <article-title>Flash CGM is associated with reduced diabetes events and hospitalizations in insulin-treated type 2 diabetes</article-title>. <source>J Endocr Soc</source>. (<year>2021</year>) <volume>5</volume>(<issue>4</issue>):<fpage>1</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1210/jendso/bvab013</pub-id></citation></ref>
<ref id="B57"><label>57.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shiwani</surname><given-names>MA</given-names></name><name><surname>Chico</surname><given-names>TJA</given-names></name><name><surname>Ciravegna</surname><given-names>F</given-names></name><name><surname>Mihaylova</surname><given-names>L</given-names></name></person-group>. <article-title>Continuous monitoring of health and mobility indicators in patients with cardiovascular disease: a review of recent technologies</article-title>. <source>Sensors</source>. (<year>2023</year>) <volume>23</volume>(<issue>12</issue>):<fpage>5752</fpage>. <pub-id pub-id-type="doi">10.3390/s23125752</pub-id><pub-id pub-id-type="pmid">37420916</pub-id></citation></ref>
<ref id="B58"><label>58.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bartolome</surname><given-names>A</given-names></name><name><surname>Prioleau</surname><given-names>T</given-names></name></person-group>. <article-title>A computational framework for discovering digital biomarkers of glycemic control</article-title>. <source>NPJ Digit Med</source>. (<year>2022</year>) <volume>5</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1038/s41746-022-00656-z</pub-id><pub-id pub-id-type="pmid">35013539</pub-id></citation></ref>
<ref id="B59"><label>59.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>Y</given-names></name><name><surname>Esmaeilzadeh</surname><given-names>P</given-names></name></person-group>. <article-title>Generative AI in medical practice: in-depth exploration of privacy and security challenges</article-title>. <source>J Med Internet Res</source>. (<year>2024</year>) <volume>26</volume>:<fpage>e53008</fpage>. <pub-id pub-id-type="doi">10.2196/53008</pub-id><pub-id pub-id-type="pmid">38457208</pub-id></citation></ref>
<ref id="B60"><label>60.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vela</surname><given-names>D</given-names></name><name><surname>Sharp</surname><given-names>A</given-names></name><name><surname>Zhang</surname><given-names>R</given-names></name><name><surname>Nguyen</surname><given-names>T</given-names></name><name><surname>Hoang</surname><given-names>A</given-names></name><name><surname>Pianykh</surname><given-names>OS</given-names></name></person-group>. <article-title>Temporal quality degradation in AI models</article-title>. <source>Sci Rep</source>. (<year>2022</year>) <volume>12</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1038/s41598-022-15245-z</pub-id><pub-id pub-id-type="pmid">34992227</pub-id></citation></ref>
<ref id="B61"><label>61.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rieke</surname><given-names>N</given-names></name><name><surname>Hancox</surname><given-names>J</given-names></name><name><surname>Li</surname><given-names>W</given-names></name><name><surname>Milletar&#x00EC;</surname><given-names>F</given-names></name><name><surname>Roth</surname><given-names>HR</given-names></name><name><surname>Albarqouni</surname><given-names>S</given-names></name><etal/></person-group> <article-title>The future of digital health with federated learning</article-title>. <source>NPJ Digit Med</source>. <year>2020</year> <volume>3</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1038/s41746-020-00323-1</pub-id><pub-id pub-id-type="pmid">31934645</pub-id></citation></ref></ref-list>
</back>
</article>