<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Artif. Intell.</journal-id>
<journal-title>Frontiers in Artificial Intelligence</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Artif. Intell.</abbrev-journal-title>
<issn pub-type="epub">2624-8212</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/frai.2024.1487335</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Artificial Intelligence</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Predicting clinical trial success for <italic>Clostridium difficile</italic> infections based on preclinical data</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Li</surname> <given-names>Fangzhou</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="fn0001"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2853936/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Youn</surname> <given-names>Jason</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="fn0001"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1137619/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Millsop</surname> <given-names>Christian</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Tagkopoulos</surname> <given-names>Ilias</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1035474/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Computer Science, University of California, Davis</institution>, <addr-line>Davis, CA</addr-line>, <country>United States</country></aff>
<aff id="aff2"><sup>2</sup><institution>Genome Center, University of California, Davis</institution>, <addr-line>Davis, CA</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>USDA/NSF AI Institute for Next Generation Food Systems, University of California, Davis</institution>, <addr-line>Davis, CA</addr-line>, <country>United States</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0002">
<p>Edited by: Tse-Yen Yang, Asia University, Taiwan</p>
</fn>
<fn fn-type="edited-by" id="fn0003">
<p>Reviewed by: TaChen Chen, Nihon Pharmaceutical University, Japan</p>
<p>Hsin-Yi Lo, China Medical University (Taiwan), Taiwan</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Ilias Tagkopoulos, <email>itagkopoulos@ucdavis.edu</email></corresp>
<fn fn-type="equal" id="fn0001">
<p><sup>&#x2020;</sup>These authors have contributed equally to this work</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>09</day>
<month>10</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>7</volume>
<elocation-id>1487335</elocation-id>
<history>
<date date-type="received">
<day>27</day>
<month>08</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>26</day>
<month>09</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2024 Li, Youn, Millsop and Tagkopoulos.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Li, Youn, Millsop and Tagkopoulos</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Preclinical models are ubiquitous and essential for drug discovery, yet our understanding of how well they translate to clinical outcomes is limited. In this study, we investigate the translational success of treatments for <italic>Clostridium difficile</italic> infection from animal models to human patients. Our analysis shows that only 36% of the preclinical and clinical experiment pairs result in translation success. Univariate analysis shows that the sustained response endpoint is correlated with translation failure (SRC&#x2009;=&#x2009;-0.20, <italic>p</italic>-value&#x2009;=&#x2009;1.53 &#x00D7; 10<sup>&#x2212;54</sup>), and explainability analysis of multi-variate random forest models shows that both sustained response endpoint and subject age are negative predictors of translation success. We have developed a recommendation system to help plan the right preclinical study given factors such as drug dosage, bacterial dosage, and preclinical/clinical endpoint. With an accuracy of 0.76 (F1 score of 0.71) and by using only 7 features (out of 68 total), the proposed system boosts translational efficiency by 25%. The method presented can extend to any disease and can serve as a preclinical to clinical translation decision support system to accelerate drug discovery and de-risk clinical outcomes.</p>
</abstract>
<kwd-group>
<kwd>machine learning</kwd>
<kwd>translational research</kwd>
<kwd>drug discovery</kwd>
<kwd>clinical trial</kwd>
<kwd>recommendation system</kwd>
</kwd-group>
<counts>
<fig-count count="4"/>
<table-count count="1"/>
<equation-count count="3"/>
<ref-count count="45"/>
<page-count count="9"/>
<word-count count="6080"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Medicine and Public Health</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<title>Introduction</title>
<p><italic>Clostridium difficile</italic> is a spore-forming anaerobic bacteria widely distributed in the intestinal tract of humans and animals and in various environmental contexts (<xref ref-type="bibr" rid="ref35">Smits et al., 2016</xref>). Over the past decade, the frequency and severity of <italic>C. difficile</italic> infection (CDI) have been increasing worldwide to become a leading nosocomial (hospital-acquired) pathogen (<xref ref-type="bibr" rid="ref9">Czepiel et al., 2019</xref>). It is estimated to affect approximately 3&#x2009;million individuals worldwide every year (<xref ref-type="bibr" rid="ref8">Cole and Stahl, 2015</xref>), underscoring its significant public health impact. Although various treatments, such as metronidazole and oral vancomycin (<xref ref-type="bibr" rid="ref44">Zar et al., 2007</xref>; <xref ref-type="bibr" rid="ref16">Johnson et al., 2014</xref>; <xref ref-type="bibr" rid="ref37">Teasley et al., 1983</xref>), have been approved for CDI management, the sustained efficacy, the effectiveness of treatment after the treatment is no longer administered, is low (<xref ref-type="bibr" rid="ref39">Van Giau et al., 2019</xref>). This is particularly concerning given the recurrent nature of CDI (<xref ref-type="bibr" rid="ref8">Cole and Stahl, 2015</xref>; <xref ref-type="bibr" rid="ref27">McFarland et al., 1999</xref>), where the sustainability of treatment efficacy (the ability to prevent recurrence post-therapy) is crucial.</p>
<p>A predominant challenge in the development of treatments for <italic>Clostridium difficile</italic>, as with many diseases, lies in the limited rate of translational success from preclinical to clinical stages. For example, the chance of a potential drug candidate identified in the preclinical trials demonstrating efficacy in human studies and ultimately receiving approval is a mere 0.1% (<xref ref-type="bibr" rid="ref32">Seyhan, 2019</xref>). Therefore, the development of a new drug is a time-consuming and costly process that often takes an average of 13&#x2009;years and costs approximately US$1&#x2009;billion (<xref ref-type="bibr" rid="ref6">Ciociola et al., 2014</xref>) from the preclinical testing stage to FDA approval. The major causes for such translation failures are the lack of appropriate animal models for predicting the efficacy of the drug in humans (<xref ref-type="bibr" rid="ref32">Seyhan, 2019</xref>; <xref ref-type="bibr" rid="ref28">Paul et al., 2010</xref>), concerns for the efficacy and safety of the drugs (<xref ref-type="bibr" rid="ref19">Kola and Landis, 2004</xref>), poor study design, ineffective site selection, poor recruitment, patient burden, and poor trial execution (<xref ref-type="bibr" rid="ref12">Fogel, 2018</xref>). Efforts to enhance translational success have included the use of humanized animals, which exhibit more human-like responses to medical interventions (<xref ref-type="bibr" rid="ref34">Shultz et al., 2007</xref>), and the application of biomarkers to reduce subjectivity in evaluating drug efficacy and safety (<xref ref-type="bibr" rid="ref43">Yu, 2011</xref>). Machine learning-based approaches (<xref ref-type="bibr" rid="ref33">Shah et al., 2019</xref>; <xref ref-type="bibr" rid="ref38">Toh et al., 2019</xref>; <xref ref-type="bibr" rid="ref14">Gayvert et al., 2016</xref>) have also been explored, predominantly focusing on attrition rates across different phases of clinical trials. However, these approaches often lack explainability due to the &#x2018;black box&#x2019; nature of the models employed, interfering with their application in decision-making with high stakes (<xref ref-type="bibr" rid="ref22">Lipton, 2017</xref>). Although machine learning models have shown promising results in other areas of life sciences (<xref ref-type="bibr" rid="ref25">Lysenko et al., 2018</xref>; <xref ref-type="bibr" rid="ref42">Wang et al., 2020</xref>; <xref ref-type="bibr" rid="ref10">Eetemadi and Tagkopoulos, 2019</xref>), their application in bridging the gap between preclinical and clinical outcomes is hindered by a scarcity of expert-curated and harmonized datasets (<xref ref-type="bibr" rid="ref2">Austin, 2021</xref>). This limitation is particularly pronounced in the context of <italic>C. difficile</italic>, where the complexity of the disease and its treatment modalities necessitates highly specialized and accurate data for effective model training and validation.</p>
<p>In this study, to address the data scarcity, we manually curate the Animal-to-Human (A2H) translation dataset by extracting and pairing preclinical and clinical data for <italic>C. difficile</italic> infections from the scientific literature and <ext-link xlink:href="https://ClinicalTrials.gov" ext-link-type="uri">ClinicalTrials.gov</ext-link>, respectively. Using our A2H dataset, we train a machine learning-based classifier to predict translational success (<xref ref-type="fig" rid="fig1">Figure 1a</xref>). Next, to address model interpretability, we apply an explainable AI method (<xref ref-type="bibr" rid="ref24">Lundberg and Lee, 2017</xref>), and then we expand this predictor to a recommendation system (<xref ref-type="fig" rid="fig1">Figure 1b</xref>).</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Overview of the preclinical recommendation system. (a) We collect data from publicly available preclinical and clinical trial information about <italic>Clostridium difficile</italic> infection. This dataset, designated as A2H, is constructed by pairing the preclinical trial with the clinical trial that shares the same drug. A binary classification label is applied to each pair, where a translation is successful (label 1) if the preclinical survival rates and clinical recovery rates are within a threshold <inline-formula>
<mml:math id="M1">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula>. Then, a machine learning pipeline chooses the best combination of feature selection, missing value imputation, outlier detection, and classifier. We report the model performance and feature interpretation and predictions. (b) For any specified clinical trial of interest, our system computes a translation score for each candidate preclinical trial. This score quantitatively assesses the potential for successful translation. The preclinical trial that emerges with the highest translation score is then preferentially chosen to inform the design of the ensuing preclinical study.</p>
</caption>
<graphic xlink:href="frai-07-1487335-g001.tif"/>
</fig>
</sec>
<sec sec-type="materials|methods" id="sec2">
<title>Materials and methods</title>
<sec id="sec3">
<title>Raw data acquisition</title>
<p>Clinical trial data about <italic>C. difficile</italic> infection (CDI) were collected from <ext-link xlink:href="https://ClinicalTrials.gov" ext-link-type="uri"><italic>ClinicalTrials.gov</italic></ext-link>, a comprehensive database of privately and publicly funded clinical studies. This study focused exclusively on completed interventional clinical trials that have published results to ensure the reliability and validity of the data. Parallel to clinical trial data collection, a thorough search was conducted on PubMed to identify publications that tested the same intervention (i.e., drug candidate) in an animal model as one of the clinical trials in our collection. Note that within the scope of a single trial, multiple experimental arms may be present, each contributing to the collective dataset. Here, an &#x2018;arm&#x2019; is delineated as a cohort or subset of subjects receiving a particular therapeutic regimen (<xref ref-type="bibr" rid="ref41">Ventz et al., 2018</xref>; <xref ref-type="bibr" rid="ref7">Clinical and Designs, 2019</xref>). For instance, if a trial investigates two distinct treatment dosages, each dosage arm is a cohort that can have multiple individuals (or samples; animals for preclinical and humans for clinical studies, respectively). This resulted in a preclinical dataset of 480 arms from 43 preclinical trials, collectively consisting of 3 animal species, 60 interventions (drug candidates), and 29 variables. Similarly, the clinical dataset has 158 arms from 52 clinical trials, collectively consisting of 53 interventions (drug candidates) and 21 total variables. The raw data and variable description can be found in <xref rid="SM1" ref-type="supplementary-material">Supplementary Data 1</xref>.</p>
</sec>
<sec id="sec4">
<title>Data compendium</title>
<p>Due to the different interests in the endpoints measured in animal and human subjects, the number of preclinical and clinical trials that share the same endpoints is limited. For example, the survival rate is predominantly measured in preclinical trials, while the recovery rate is more often used in clinical trials for CDI. The survival rate indicates the ratio of living subjects, while the recovery rate indicates the ratio of healthy patients in the group at the point of measure. These two rates both reflect drug efficacy (<xref ref-type="bibr" rid="ref45">Zhuang et al., 2009</xref>), making them more comparable and relevant for evaluating the effectiveness of treatments in both preclinical and clinical trials. In this section, we describe a strategy to derive translation outcome using these survival and recovery rates.</p>
<p>For preclinical studies, 480 arms with 27 variables were gathered, including specifics of animal (e.g., species, strain, sex, age, weight), disease model (e.g., administration sequence, disease strain), and drug (e.g., dosing, duration). For clinical studies, 272 arms with 15 variables were collected, encompassing aspects like dosage details, intervention class, therapeutic approach, and participant demographics. We then paired the preclinical and clinical trial arms that tested the same intervention (drug candidate) to construct an A2H dataset, which consists of 6,918 samples and 42 variables (27 from preclinical trials and 15 from clinical trials) after data cleaning and dropping 8 variables from the raw datasets (<xref rid="SM1" ref-type="supplementary-material">Supplementary Information Section 1.1</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Data 2</xref>). To analytically assign the binary dependent variable, we first calculated the difference between recovery and survival rates, denoted as <inline-formula>
<mml:math id="M2">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula> (<xref ref-type="disp-formula" rid="EQ1">Equation 1</xref>), for each sample in the paired dataset as follows:</p>
<disp-formula id="EQ1">
<label>(1)</label>
<mml:math id="M3">
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.0</mml:mn>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>&#x03B4;</mml:mi>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>r</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>s</mml:mi>
</mml:msub>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>1.0</mml:mn>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M4">
<mml:mrow>
<mml:mn>0.0</mml:mn>
<mml:mo>&#x2264;</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>s</mml:mi>
</mml:msub>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>1.0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> is the survival rate for animal subjects in the preclinical study, and <inline-formula>
<mml:math id="M5">
<mml:mrow>
<mml:mn>0.0</mml:mn>
<mml:mo>&#x2264;</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>r</mml:mi>
</mml:msub>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>1.0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> is the recovery rate for human subjects in the clinical study. We then fit a normal distribution (<xref ref-type="disp-formula" rid="EQ2">Equation 2</xref>) to these deltas as</p>
<disp-formula id="EQ2">
<label>(2)</label>
<mml:math id="M6">
<mml:mrow>
<mml:mi>&#x03B4;</mml:mi>
<mml:mo>~</mml:mo>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>&#x03BC;</mml:mi>
<mml:mi mathvariant="normal">,</mml:mi>
<mml:mi>&#x03C3;</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where mean (<inline-formula>
<mml:math id="M7">
<mml:mi>&#x03BC;</mml:mi>
</mml:math>
</inline-formula>) and standard deviation (<inline-formula>
<mml:math id="M8">
<mml:mi>&#x03C3;</mml:mi>
</mml:math>
</inline-formula>) estimate the standard distribution of <inline-formula>
<mml:math id="M9">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula>. We assigned the binary label as follows:</p>
<disp-formula id="EQ3">
<label>(3)</label>
<mml:math id="M10">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mspace width="thickmathspace"/>
<mml:mfenced>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi mathvariant="normal">&#x00A0;</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>s</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>:</mml:mo>
<mml:mo>|</mml:mo>
<mml:mi>&#x03B4;</mml:mi>
<mml:mo>|</mml:mo>
<mml:mo>&#x003C;</mml:mo>
<mml:mi>c</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>&#x03C3;</mml:mi>
<mml:mo>,</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mspace width="thickmathspace"/>
<mml:mn>0</mml:mn>
<mml:mspace width="thickmathspace"/>
<mml:mfenced>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi mathvariant="normal">&#x00A0;</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>:</mml:mo>
<mml:mo>|</mml:mo>
<mml:mi>&#x03B4;</mml:mi>
<mml:mo>|</mml:mo>
<mml:mo>&#x2265;</mml:mo>
<mml:mi>c</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>&#x03C3;</mml:mi>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math id="M12">
<mml:mi>c</mml:mi>
</mml:math>
</inline-formula> is a coefficient that controls the strictness of the translation success (<xref ref-type="disp-formula" rid="EQ3">Equation 3</xref>). We visualized our performance statistics using the A2H dataset with labels assigned with <inline-formula>
<mml:math id="M13">
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.5</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. However, different choices of <inline-formula>
<mml:math id="M14">
<mml:mi>c</mml:mi>
</mml:math>
</inline-formula> were also analyzed and reported (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure 1</xref>).</p>
</sec>
<sec id="sec5">
<title>Model selection</title>
<p>To find the most predictive machine learning model for our preclinical-to-clinical translation, we implemented a model selection pipeline that chooses the best data preprocessing combination and classifier. The categorical variables were transformed into input features applicable to machine learning using one-hot encoding. The pipeline includes, in the order specified, 2 feature scaling [Standard (<xref ref-type="bibr" rid="ref29">Pedregosa et al., 2011</xref>) and MinMax (<xref ref-type="bibr" rid="ref29">Pedregosa et al., 2011</xref>)], 1 missing value imputation (MVI) method [Simple (<xref ref-type="bibr" rid="ref29">Pedregosa et al., 2011</xref>)], 1 oversampling (OS) [SMOTE (<xref ref-type="bibr" rid="ref5">Chawla et al., 2002</xref>)], and 3 classifiers (CLS) [random forests (<xref ref-type="bibr" rid="ref4">Breiman, 2001</xref>), AdaBoost (<xref ref-type="bibr" rid="ref13">Freund and Schapire, 1997</xref>), MLP (<xref ref-type="bibr" rid="ref15">Hinton, 1990</xref>)]. We rigorously tested each possible permutation of these preprocessing steps combined with a classifier using a 5-fold cross-validation approach to ensure robust evaluation, where each split was stratified, and samples from the same preclinical and clinical pair were grouped while splitting (<xref rid="SM1" ref-type="supplementary-material">Supplementary Information Section 1.2</xref>). Moreover, a grid search was performed on the classifiers to find the optimal hyperparameters using the validation set. Ultimately, the model candidate with the highest F1 score was selected as the best model. We have provided more in detailed information in <xref rid="SM1" ref-type="supplementary-material">Supplementary Information Section 1.3</xref>.</p>
</sec>
<sec id="sec6">
<title>Model interpretability</title>
<p>To increase the interpretability of the model, we applied the Shapley Additive Explanations (SHAP) (<xref ref-type="bibr" rid="ref24">Lundberg and Lee, 2017</xref>) algorithm. The greater the magnitude of the SHAP value of a feature, the more influence that feature has on the model output. SHAP can provide the local explanation for each sample and the global explanation for an entire class by summarizing the overall importance of features across all data points. In this study, we used SHAP to analyze features that are influential in general to determine translation success.</p>
</sec>
</sec>
<sec sec-type="results" id="sec7">
<title>Results</title>
<sec id="sec8">
<title>Experimental features correlated to preclinical to clinical translation success</title>
<p><xref ref-type="fig" rid="fig2">Figure 2a</xref> depicts the spectral biclustering (<xref ref-type="bibr" rid="ref18">Kluger et al., 2003</xref>) of the 5,851 preclinical-clinical pair samples, excluding control intervention and inconvertible unit samples from the original 6,918, across the 68 features after performing one-hot encoding to the original 42 variables. From top to bottom, the fourth and sixth row clusters were associated with the lowest and highest average translation success rates of 0.25 and 0.45, respectively. We found that the row cluster with the lowest average translation success rate differentiated from other clusters due to its unique disease model, which challenged first and then treated animals with clindamycin (<italic>p</italic>-value&#x003C;4.77 &#x00D7; 10<sup>&#x2212;122</sup>). Similarly, the cluster with the highest average translation success rate had adopted <italic>C. difficile</italic> strains (e.g., VA11, 2,926, VA5, TTU 614) that were significantly different from those used in other clusters (<italic>p</italic>-value&#x003C;7.2 &#x00D7; 10<sup>&#x2212;13</sup>). A t-SNE plot for the A2H dataset can also be found in <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure 2</xref>. The distribution of success metrics in both preclinical and clinical trials, specifically focusing on the survival and recovery rates, respectively, are shown in <xref ref-type="fig" rid="fig2">Figures 2b</xref>,<xref ref-type="fig" rid="fig2">c</xref>. These rates are skewed toward the right, partly due to the use of existing drugs like vancomycin and metronidazole as controls in case&#x2013;control studies (<xref ref-type="bibr" rid="ref17">Kaye et al., 2005</xref>). Delta (<inline-formula>
<mml:math id="M15">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula>), the difference between the recovery rate and survival rate used to assign the target variable (translation success/failure) (see Methods), was modeled using a normal distribution as <inline-formula>
<mml:math id="M16">
<mml:mrow>
<mml:mi>&#x03B4;</mml:mi>
<mml:mo>~</mml:mo>
<mml:mi>N</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mn>0.09</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>0.41</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> (<xref ref-type="fig" rid="fig2">Figure 2d</xref>). We labeled the preclinical and clinical trial pairs (see Methods) that fell within &#x00B1;0.5 standard deviation of <inline-formula>
<mml:math id="M17">
<mml:mrow>
<mml:mi>&#x03B4;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> as &#x2018;translation success.&#x2019; (3,746 samples) and &#x2018;translation failure&#x2019; otherwise (2,105 samples) (<xref ref-type="fig" rid="fig2">Figure 2d</xref>). Spearman correlation coefficient of the features with the dependent variable lists 8 preclinical features as the top 10 most correlated features (<xref ref-type="fig" rid="fig2">Figure 2e</xref>), among which sustained response endpoint (i.e., outcome measured 14&#x2009;days after the treatment) of the clinical trial was most negatively correlated to translation success (SRC&#x2009;=&#x2009;-0.20, <italic>p</italic>-value&#x2009;=&#x2009;1.53 &#x00D7; 10<sup>&#x2212;54</sup>).</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Statistics of the A2H dataset. (a) The spectral biclustering (<italic>K<sub>row</sub></italic> = 8 and <italic>K<sub>col</sub></italic> = 59) plot of the A2H dataset with<inline-formula>
<mml:math id="M20">
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi>&#x03B4;</mml:mi>
<mml:mo>|</mml:mo>
<mml:mo>&#x003C;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>.</mml:mo>
<mml:mn>5</mml:mn>
<mml:mi>&#x03C3;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>. The vertical and horizontal red dashed lines separate column and row clusters, respectively. The features on the x-axis with colons in their names represent categorical features after one-hot encoding, and the string after the colon corresponds to the original category when the encoded feature is 1. The features without colons in their names represent numerical features, and the Min-Max scaling is performed on each numerical feature independently. (b) The distribution of the survival rate from the preclinical trial. (c) The distribution of the recovery rate from the clinical trial. (d) The distribution of delta <inline-formula>
<mml:math id="M21">
<mml:mrow>
<mml:mi>&#x03B4;</mml:mi>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>r</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>s</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, the difference between the clinical trial recovery rate and the preclinical trial survival rate. After fitting the normal distribution <inline-formula>
<mml:math id="M22">
<mml:mrow>
<mml:mi>&#x03B4;</mml:mi>
<mml:mo>~</mml:mo>
<mml:mi>N</mml:mi>
<mml:mfenced>
<mml:mrow>
<mml:mi>&#x03BC;</mml:mi>
<mml:mi mathvariant="normal">,</mml:mi>
<mml:mi>&#x03C3;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</inline-formula> to the delta, we label the preclinical/clinical trial pairs translation success (label 1) if <inline-formula>
<mml:math id="M23">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula> lies between <inline-formula>
<mml:math id="M24">
<mml:mrow>
<mml:mo>&#x00B1;</mml:mo>
<mml:mn>0.5</mml:mn>
<mml:mi>&#x03C3;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> around, and translation failure (label 0) otherwise. (e) Top 10 features with the highest absolute Spearman correlation coefficients for thresholds <inline-formula>
<mml:math id="M25">
<mml:mrow>
<mml:mfenced close="|" open="|">
<mml:mi>&#x03B4;</mml:mi>
</mml:mfenced>
<mml:mo>&#x003C;</mml:mo>
<mml:mn>0.5</mml:mn>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>&#x03C3;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, where <inline-formula>
<mml:math id="M26">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula> is the different between clinical recovery and preclinical survival rates, and <inline-formula>
<mml:math id="M27">
<mml:mi>&#x03C3;</mml:mi>
</mml:math>
</inline-formula> is the standard deviation of <inline-formula>
<mml:math id="M28">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula>. All the features have adjusted <italic>p</italic>-value &#x003C;0.001.</p>
</caption>
<graphic xlink:href="frai-07-1487335-g002.tif"/>
</fig>
</sec>
<sec id="sec9">
<title>Machine learning models accurately predict translation success</title>
<p>We implemented the model selection pipeline on A2H datasets created using different translation thresholds <inline-formula>
<mml:math id="M29">
<mml:mi>c</mml:mi>
</mml:math>
</inline-formula> (0.0625, 0.125, 0.25, 0.5, 1.0, and 2.0) (see Methods). In every scenario during the cross-validation process, the random forest model emerged as the top-performing classifier (<xref rid="SM1" ref-type="supplementary-material">Supplementary Table 1</xref>). Notably, we observed an improvement of the F1 score when applying SMOTE, especially for thresholds defined by smaller <italic>c</italic> (F1 improved 126.3, 124.9, 39.3, and 2.7% for <italic>c</italic> of 0.0625, 0.125, 0.25, 0.5, respective; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure 3</xref>). Running the sequential feature selection (<xref ref-type="bibr" rid="ref30">Raschka, 2018</xref>) (SFS) in a parsimonious setting (smallest feature subset that is within one standard error of the best cross-validation F1 score) on the best pipeline with <inline-formula>
<mml:math id="M30">
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.5</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (FS: none, MVI: Simple, OS: SMOTE, CLS: random forest) significantly reduced the required number of features by 76.5% from 68 to 16 with negligible 0.8% performance loss (validation set F1 score decrease from 0.75 to 0.74) as shown in <xref ref-type="fig" rid="fig3">Figure 3a</xref>, where the results for other value of <inline-formula>
<mml:math id="M31">
<mml:mi>c</mml:mi>
</mml:math>
</inline-formula> can be found in <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure 4</xref>. Moreover, we were able to achieve validation set F1 score of 0.73 with only 7 features identified using the Kneedle elbow method (<xref ref-type="bibr" rid="ref31">Satopaa et al., 2011</xref>; <xref ref-type="fig" rid="fig3">Figure 3A</xref>). <xref ref-type="table" rid="tab1">Table 1</xref> further shows the holdout test set performance for different numbers of features for the best model. The best model pipeline for the benchmark A2H dataset (<inline-formula>
<mml:math id="M32">
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.5</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>) on the holdout test set achieved a 25% better F1 score than a random baseline (0.69 vs. 0.56, respectively), while AUCPR and AUCROC were 0.68 and 0.82, respectively (<xref ref-type="fig" rid="fig3">Figures 3b</xref>&#x2013;<xref ref-type="fig" rid="fig3">d</xref>). For all six different translation thresholds <inline-formula>
<mml:math id="M33">
<mml:mi>c</mml:mi>
</mml:math>
</inline-formula> except when <inline-formula>
<mml:math id="M34">
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>2.0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, we had better performance than the random baseline (<xref ref-type="fig" rid="fig3">Figure 3c</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Table 2</xref>).</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Prediction performance of the ML translation predictor. (a) Sequential feature selection results for different modes of selection criteria using the validation set. <italic>Best</italic> is the smallest feature subset when the F1 score was the best, <italic>parsimonious</italic> is the smallest feature subset that is within one standard error of the cross-validation performance, and <italic>elbow</italic> is the smallest feature subset based on the Kneedle method. (b) Precision-recall (PR) curves of different <inline-formula>
<mml:math id="M35">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula> cutoff thresholds on the test set. F1<sub>OOP</sub> denotes the optimal operating point chosen based on the best F1 score. The values above the dots indicate the F1 scores of OOPs. AUCPR stands for the area under the PR curve. (c) Performance metrics of different datasets created with different <inline-formula>
<mml:math id="M36">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula> cutoff thresholds on the test set. (d) Receiver operating characteristic (ROC) curves of different <inline-formula>
<mml:math id="M37">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula> cutoff thresholds based on the test set. AUCROC stands for the area under the ROC curve.</p>
</caption>
<graphic xlink:href="frai-07-1487335-g003.tif"/>
</fig>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>The holdout test confusion matrix for the best translation model with <inline-formula>
<mml:math id="M38">
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi>&#x03B4;</mml:mi>
<mml:mo>|</mml:mo>
<mml:mo>&#x003C;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>.</mml:mo>
<mml:mn>5</mml:mn>
<mml:mi>&#x03C3;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Model</th>
<th align="center" valign="top">TP</th>
<th align="center" valign="top">FN</th>
<th align="center" valign="top">FP</th>
<th align="center" valign="top">TN</th>
<th align="center" valign="top">Precision</th>
<th align="center" valign="top">Recall</th>
<th align="center" valign="top">F1</th>
<th align="center" valign="top">Accuracy</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Baseline</td>
<td align="center" valign="top">
<bold>430</bold>
</td>
<td align="center" valign="top">
<bold>0</bold>
</td>
<td align="center" valign="top">668</td>
<td align="center" valign="top">0</td>
<td align="char" valign="top" char=".">0.39</td>
<td align="char" valign="top" char=".">
<bold>1</bold>
</td>
<td align="char" valign="top" char=".">0.56</td>
<td align="char" valign="top" char=".">0.39</td>
</tr>
<tr>
<td align="left" valign="top" char="." colspan="9">Random forest</td>
</tr>
<tr>
<td align="left" valign="top">
<list list-type="bullet">
<list-item>
<p>Best (<italic>K</italic>&#x2009;=&#x2009;35)</p>
</list-item>
</list>
</td>
<td align="center" valign="top">298</td>
<td align="center" valign="top">132</td>
<td align="center" valign="top">
<bold>121</bold>
</td>
<td align="center" valign="top">
<bold>547</bold>
</td>
<td align="char" valign="top" char=".">
<bold>0.71</bold>
</td>
<td align="char" valign="top" char=".">0.69</td>
<td align="char" valign="top" char=".">
<underline>0.70</underline>
</td>
<td align="char" valign="top" char=".">
<bold>0.77</bold>
</td>
</tr>
<tr>
<td align="left" valign="top">
<list list-type="bullet">
<list-item>
<p>Parsimonious (<italic>K</italic>&#x2009;=&#x2009;16)</p>
</list-item>
</list>
</td>
<td align="center" valign="top">303</td>
<td align="center" valign="top">127</td>
<td align="center" valign="top">
<underline>131</underline>
</td>
<td align="center" valign="top">
<underline>537</underline>
</td>
<td align="char" valign="top" char=".">
<underline>0.70</underline>
</td>
<td align="char" valign="top" char=".">0.70</td>
<td align="char" valign="top" char=".">
<underline>0.70</underline>
</td>
<td align="char" valign="top" char=".">
<bold>0.77</bold>
</td>
</tr>
<tr>
<td align="left" valign="top">
<list list-type="bullet">
<list-item>
<p>Elbow (<italic>K</italic>&#x2009;=&#x2009;7)</p>
</list-item>
</list>
</td>
<td align="center" valign="top">
<underline>335</underline>
</td>
<td align="center" valign="top">
<underline>95</underline>
</td>
<td align="center" valign="top">173</td>
<td align="center" valign="top">495</td>
<td align="char" valign="top" char=".">0.66</td>
<td align="char" valign="top" char=".">
<underline>0.78</underline>
</td>
<td align="char" valign="top" char=".">
<bold>0.71</bold>
</td>
<td align="char" valign="top" char=".">
<underline>0.76</underline>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>The baseline model would always predict positive (translation success). For the random forest model, we showed three scenarios with different feature selection criteria. <italic>K</italic> denotes the number of features selected from the total 68 features. While deploying the model in real life, fewer features would reduce data collection costs. For each metric, the best performance was highlighted in bold, and the second best was highlighted with an underscore.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec10">
<title>Sustained response endpoint and subject age as predictors of translation success</title>
<p>We analyzed the feature importance of the best model for each <inline-formula>
<mml:math id="M39">
<mml:mi>c</mml:mi>
</mml:math>
</inline-formula> using five ranking methods: sequential feature selection, linear discriminant analysis (LDA), Pearson correlation coefficient (PCC), impurity-based feature importance of random forest (RF), and SHAP as shown in <xref ref-type="fig" rid="fig4">Figure 4a</xref> for <inline-formula>
<mml:math id="M40">
<mml:mi>c</mml:mi>
</mml:math>
</inline-formula> = 0.5. Of the 16 features selected by SFS, only three were from clinical features. The five ranking methods consensually identified whether clinical and preclinical endpoints were sustained or acute as most influential to the translation prediction (mean rank&#x2009;=&#x2009;1 and 2.2). We found that RF and SHAP could highlight the importance of dosage-relevant features, while linear methods like LDA and PCC could not. A further investigation of SHAP values provided more detailed insights into the relationship between feature values and their impact on predictions. Specifically, the model considered sustained preclinical and clinical endpoints would decrease the translation success probability (mean SHAP value&#x2009;=&#x2009;&#x2212;0.14 for both). This observation can be explained by the significantly lower translation success for samples with sustained preclinical and clinical endpoints compared to those with at least one acute endpoint (<italic>p</italic>-value&#x2009;=&#x2009;3.3 &#x00D7; 10<sup>&#x2212;10</sup>). The model also considered younger subjects for both animals and humans would be more likely to result in translation failure, with the animal age being highly correlated with the SHAP value (p-value&#x2009;=&#x2009;3.9 &#x00D7; 10<sup>&#x2212;298</sup>), with a smaller animal age value resulting in a more negative impact on translation success probability. Also, for the human subjects, the SHAP value of the child age group was significantly smaller than the more-aged group (mean SHAP value&#x2009;=&#x2009;0.01 vs. -0.18; <italic>p</italic>-value&#x2009;=&#x2009;8.7 &#x00D7; 10<sup>&#x2212;164</sup>). The SHAP performance for other <inline-formula>
<mml:math id="M41">
<mml:mi>c</mml:mi>
</mml:math>
</inline-formula> can be found in <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure 5</xref>.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Comparison of feature importance and SHAP results. The rank of the 16 features, as selected using parsimonious selection criteria of the sequential feature selection, using different analysis methods (LDA: rank based on the absolute value of linear discriminant analysis, PCC: rank based on the absolute value of Pearson correlation coefficient, RF: rank based on random forest, and SHAP: rank based on the absolute value of SHAP). For the beeswarm plot on the right, each dot represents a data point, where red and blue correspond to high and low feature values, respectively. SHAP value indicates the amount of increase in translation success probability the feature causes for that data point. For example, a red dot with a positive SHAP value means that having a high feature value has a positive impact on predicting translation success for that data point.</p>
</caption>
<graphic xlink:href="frai-07-1487335-g004.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="sec11">
<title>Discussion</title>
<p>Our research underscores the importance of refined preclinical strategies in drug development, a principle that holds true across various medical fields. The necessity for improved preclinical approaches, as indicated by the frequent phase III failures due to a lack of responder hypothesis-based trials (<xref ref-type="bibr" rid="ref36">Sun et al., 2022</xref>), aligns with our findings, where a machine learning model driven by a selective feature set significantly enhanced the predictability of translational success.</p>
<p>Our choice to focus on <italic>C. difficile</italic> in this study stems from several key considerations. Firstly, the existence of well-established rodent models for <italic>C. difficile</italic> infection closely mimics the human disease and provides a robust basis for preclinical studies, therefore allowing for more accurate predictions of clinical outcomes. Additionally, the pressing need for improved treatment strategies for <italic>C. difficile</italic> infections, given their increasing prevalence and public health impact, underscores the practical significance of our research. Furthermore, the localized nature of <italic>C. difficile</italic> infections in the gut (<xref ref-type="bibr" rid="ref3">Best et al., 2012</xref>), as opposed to systemic diseases, presents a unique opportunity. It allows for more controlled study parameters and a clearer understanding of treatment effects, which are critical for the successful application of machine learning techniques in predicting translational outcomes. This aspect is particularly vital in lightening the complexity that often accompanies the study of systemic diseases, where multiple organ systems and a myriad of physiological factors can confound results (<xref ref-type="bibr" rid="ref26">Manor and Lipsitz, 2013</xref>).</p>
<p>There are a few areas of improvement. First, we assumed a direct and linear relationship between preclinical survival rates and clinical recovery rates. Yet, it is important to acknowledge that these metrics, while informative, may not fully capture the multifaceted nature of trial outcomes. Future studies could benefit from incorporating additional endpoints, such as percent weight change, patient-reported, and quality-of-life assessments, to provide a more comprehensive evaluation of trial success as well as the clinical utility. This, however, would result in a more complicated definition for translation success, which, in the future, would require us to provide better explanations for our recommendations such that they would be trustworthy and actionable for drug development researchers. Second, rather than employing the delta <inline-formula>
<mml:math id="M42">
<mml:mi>&#x03B4;</mml:mi>
</mml:math>
</inline-formula>, which represents the difference between survival and recovery rates in current work, we could involve using a ratio of these rates. This change would be significant because a 10% difference in lower rates has different implications compared to a 10% difference in higher rates. Third, due to the complicated nature of (pre) clinical experimental designs, comparing results across different studies may have confounding biases resulting from unobserved variables. In this work, for example, we directly modeled the translation between preclinical and clinical trials, while in reality, trials usually consist of comparator groups to account for experimental biases. As a future improvement, we plan to adapt a recent work that used pairwise meta-learning to allow the model to learn across different experiments efficiently (<xref ref-type="bibr" rid="ref11">Feng et al., 2024</xref>). Fourth, we would like to dive deeper into analyzing the impact of dosage regimens on model predictions. During our SHAP analysis, we found that high dosage amounts in preclinical trials had a positive impact on the model predictions on translation success rate, while they had a negative impact in clinical trials. While interesting, SHAP might produce misleading explanations for highly correlated features, e.g., daily dosage amount vs. dosage times per day (<xref ref-type="bibr" rid="ref1">Aas et al., 2021</xref>). Dosage information is essential in drug development, and we aim to conduct a focused, rigorous analysis of dosage regimens for our next study phase. Fifth, the primary challenge of the data curation process is its dependency on expert-guided manual data curation. The current random forest model trained on a small dataset outperformed the state-of-the-art deep learning models, such as neural networks. The advantage of deep neural networks is their capability to generalize the representation to transfer to similar domain datasets (<xref ref-type="bibr" rid="ref20">LeCun et al., 2015</xref>). Implementing an automated data extraction pipeline, leveraging transformer-based large language models (LLMs)(<xref ref-type="bibr" rid="ref21">Lee et al., 2019</xref>; <xref ref-type="bibr" rid="ref40">Vaswani et al., 2017</xref>; <xref ref-type="bibr" rid="ref23">Liu et al., 2023</xref>), would significantly enhance the efficiency of extracting data from existing literature. This enhancement would be beneficial not only for <italic>C. difficile</italic> infection but also for a broader range of bacterial diseases, such as streptococcal infections, tuberculosis, and salmonellosis. By creating a dataset enriched with multi-omics information for these diverse diseases, we can develop a more generalizable ML-based predictor that demonstrates higher performance. We also consider including more clinical variables, such as patient demographics and health conditions, to further enhance the capability of our predictor. Additionally, this enriched dataset would facilitate intra-clinical predictions, such as forecasting the outcomes of clinical trial phase 2 based on phase 1 data.</p>
</sec>
<sec sec-type="conclusions" id="sec12">
<title>Conclusion</title>
<p>This study aims to help translate preclinical findings to clinical outcomes for <italic>Clostridium difficile</italic> infections, leveraging machine learning to enhance predictive accuracy and interpretability. Our model identifies key factors influencing translational success, streamlining drug development for CDI and potentially other diseases. This approach not only promises more effective treatments but also exemplifies the transformative impact of integrating computational methods in modern medicine, paving the way for advancements in personalized healthcare. The source code for our A2H recommendations system can be found at <ext-link xlink:href="https://github.com/IBPA/A2H" ext-link-type="uri">https://github.com/IBPA/A2H</ext-link>.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec13">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/<xref rid="SM1" ref-type="supplementary-material">Supplementary material</xref>.</p>
</sec>
<sec sec-type="author-contributions" id="sec14">
<title>Author contributions</title>
<p>FL: Formal analysis, Methodology, Software, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. JY: Formal analysis, Methodology, Software, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. CM: Data curation, Formal analysis, Writing &#x2013; review &#x0026; editing. IT: Conceptualization, Funding acquisition, Investigation, Project administration, Resources, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="funding-information" id="sec15">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This work was supported by the United States Department of Agriculture-National Institute of Food and Agriculture AI Institute for Next Generation Food Systems (AIFS), USDA-NIFA award number 2020&#x2013;67021-32855.</p>
</sec>
<sec sec-type="COI-statement" id="sec16">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="sec17">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec18">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/frai.2024.1487335/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/frai.2024.1487335/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.XLSX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_2.XLSX" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_3.docx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aas</surname> <given-names>K.</given-names></name> <name><surname>Jullum</surname> <given-names>M.</given-names></name> <name><surname>L&#x00F8;land</surname> <given-names>A.</given-names></name></person-group> (<year>2021</year>). <article-title>Explaining individual predictions when features are dependent: more accurate approximations to Shapley values</article-title>. <source>Artif. Intell.</source> <volume>298</volume>:<fpage>103502</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.artint.2021.103502</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Austin</surname> <given-names>C. P.</given-names></name></person-group> (<year>2021</year>). <article-title>Opportunities and challenges in translational science</article-title>. <source>Clin. Transl. Sci.</source> <volume>14</volume>, <fpage>1629</fpage>&#x2013;<lpage>1647</lpage>. doi: <pub-id pub-id-type="doi">10.1111/cts.13055</pub-id>, PMID: <pub-id pub-id-type="pmid">33982407</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Best</surname> <given-names>E. L.</given-names></name> <name><surname>Freeman</surname> <given-names>J.</given-names></name> <name><surname>Wilcox</surname> <given-names>M. H.</given-names></name></person-group> (<year>2012</year>). <article-title>Models for the study of <italic>Clostridium difficile</italic> infection</article-title>. <source>Gut Microbes</source> <volume>3</volume>, <fpage>145</fpage>&#x2013;<lpage>167</lpage>. doi: <pub-id pub-id-type="doi">10.4161/gmic.19526</pub-id>, PMID: <pub-id pub-id-type="pmid">22555466</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Breiman</surname> <given-names>L.</given-names></name></person-group> (<year>2001</year>). <article-title>Random forests</article-title>. <source>Mach. Learn.</source> <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>32</lpage>. doi: <pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chawla</surname> <given-names>N. V.</given-names></name> <name><surname>Bowyer</surname> <given-names>K. W.</given-names></name> <name><surname>Hall</surname> <given-names>L. O.</given-names></name> <name><surname>Kegelmeyer</surname> <given-names>W. P.</given-names></name></person-group> (<year>2002</year>). <article-title>SMOTE: synthetic minority over-sampling technique</article-title>. <source>J. Artif. Intell. Res.</source> <volume>16</volume>, <fpage>321</fpage>&#x2013;<lpage>357</lpage>. doi: <pub-id pub-id-type="doi">10.1613/jair.953</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ciociola</surname> <given-names>A. A.</given-names></name> <name><surname>Cohen</surname> <given-names>L. B.</given-names></name> <name><surname>Kulkarni</surname> <given-names>P.</given-names></name> <name><surname>Kefalas</surname> <given-names>C.</given-names></name> <name><surname>Buchman</surname> <given-names>A.</given-names></name> <name><surname>Burke</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>How drugs are developed and approved by the FDA: current process and future directions</article-title>. <source>Am. J. Gastroenterol.</source> <volume>109</volume>, <fpage>620</fpage>&#x2013;<lpage>623</lpage>. doi: <pub-id pub-id-type="doi">10.1038/ajg.2013.407</pub-id>, PMID: <pub-id pub-id-type="pmid">24796999</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Clinical</surname> <given-names>N. B.</given-names></name> <name><surname>Designs</surname> <given-names>T.</given-names></name></person-group> (<year>2019</year>). <article-title>Indian</article-title>. <source>Dermatol. Online J.</source> <volume>10</volume>, <fpage>193</fpage>&#x2013;<lpage>201</lpage>. doi: <pub-id pub-id-type="doi">10.4103/idoj.IDOJ_475_18</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cole</surname> <given-names>S. A.</given-names></name> <name><surname>Stahl</surname> <given-names>T. J.</given-names></name></person-group> (<year>2015</year>). <article-title>Persistent and recurrent <italic>Clostridium difficile</italic> colitis</article-title>. <source>Clin. Colon Rectal Surg.</source> <volume>28</volume>, <fpage>065</fpage>&#x2013;<lpage>069</lpage>. doi: <pub-id pub-id-type="doi">10.1055/s-0035-1547333</pub-id>, PMID: <pub-id pub-id-type="pmid">26034401</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Czepiel</surname> <given-names>J.</given-names></name> <name><surname>Dr&#x00F3;&#x017C;d&#x017C;</surname> <given-names>M.</given-names></name> <name><surname>Pituch</surname> <given-names>H.</given-names></name> <name><surname>Kuijper</surname> <given-names>E. J.</given-names></name> <name><surname>Perucki</surname> <given-names>W.</given-names></name> <name><surname>Mielimonka</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title><italic>Clostridium difficile</italic> infection</article-title>. <source>Eur. J. Clin. Microbiol. Infect. Dis.</source> <volume>38</volume>, <fpage>1211</fpage>&#x2013;<lpage>1221</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10096-019-03539-6</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eetemadi</surname> <given-names>A.</given-names></name> <name><surname>Tagkopoulos</surname> <given-names>I.</given-names></name></person-group> (<year>2019</year>). <article-title>Genetic neural networks: an artificial neural network architecture for capturing gene expression relationships</article-title>. <source>Bioinformatics</source> <volume>35</volume>, <fpage>2226</fpage>&#x2013;<lpage>2234</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/bty945</pub-id>, PMID: <pub-id pub-id-type="pmid">30452523</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Feng</surname> <given-names>B.</given-names></name> <name><surname>Liu</surname> <given-names>Z.</given-names></name> <name><surname>Huang</surname> <given-names>N.</given-names></name> <name><surname>Xiao</surname> <given-names>Z.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name> <name><surname>Mirzoyan</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>A bioactivity foundation model using pairwise meta-learning</article-title>. <source>Nat. Mach. Intell.</source> <volume>6</volume>, <fpage>962</fpage>&#x2013;<lpage>974</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s42256-024-00876-w</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fogel</surname> <given-names>D. B.</given-names></name></person-group> (<year>2018</year>). <article-title>Factors associated with clinical trials that fail and opportunities for improving the likelihood of success: a review</article-title>. <source>Contemp. Clin. Trials Commun.</source> <volume>11</volume>, <fpage>156</fpage>&#x2013;<lpage>164</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.conctc.2018.08.001</pub-id>, PMID: <pub-id pub-id-type="pmid">30112460</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Freund</surname> <given-names>Y.</given-names></name> <name><surname>Schapire</surname> <given-names>R. E.</given-names></name></person-group> (<year>1997</year>). <article-title>A decision-theoretic generalization of on-line learning and an application to boosting</article-title>. <source>J. Comput. Syst. Sci.</source> <volume>55</volume>, <fpage>119</fpage>&#x2013;<lpage>139</lpage>. doi: <pub-id pub-id-type="doi">10.1006/jcss.1997.1504</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gayvert</surname> <given-names>K. M.</given-names></name> <name><surname>Madhukar</surname> <given-names>N. S.</given-names></name> <name><surname>Elemento</surname> <given-names>O.</given-names></name></person-group> (<year>2016</year>). <article-title>A data-driven approach to predicting successes and failures of clinical trials</article-title>. <source>Cell Chem. Biol.</source> <volume>23</volume>, <fpage>1294</fpage>&#x2013;<lpage>1301</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.chembiol.2016.07.023</pub-id>, PMID: <pub-id pub-id-type="pmid">27642066</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hinton</surname> <given-names>G. E.</given-names></name></person-group> (<year>1990</year>). <article-title>20- CONNECTIONIST LEARNING PROCEDURES11This chapter appeared in volume 40 of artificial intelligence in 1989, reprinted with permission of North-Holland publishing. It is a revised version of technical report CMU-CS-87-115, which has the same title and was prepared in June 1987 while the author was at Carnegie Mellon University. The research was supported by contract N00014-86-K-00167 from the Office of Naval Research and by grant IST-8520359 from the National Science Foundation</article-title>. <source>Mach. Learn.</source> <volume>1</volume>, <fpage>555</fpage>&#x2013;<lpage>610</lpage>.</citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Johnson</surname> <given-names>S.</given-names></name> <name><surname>Louie</surname> <given-names>T. J.</given-names></name> <name><surname>Gerding</surname> <given-names>D. N.</given-names></name> <name><surname>Cornely</surname> <given-names>O. A.</given-names></name> <name><surname>Chasan-Taber</surname> <given-names>S.</given-names></name> <name><surname>Fitts</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Vancomycin, metronidazole, or tolevamer for <italic>Clostridium difficile</italic> infection: results from two multinational, randomized, controlled trials</article-title>. <source>Clin. Infect. Dis.</source> <volume>59</volume>, <fpage>345</fpage>&#x2013;<lpage>354</lpage>. doi: <pub-id pub-id-type="doi">10.1093/cid/ciu313</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kaye</surname> <given-names>K. S.</given-names></name> <name><surname>Harris</surname> <given-names>A. D.</given-names></name> <name><surname>Samore</surname> <given-names>M.</given-names></name> <name><surname>Carmeli</surname> <given-names>Y.</given-names></name></person-group> (<year>2005</year>). <article-title>The case-case-control study design: addressing the limitations of risk factor studies for antimicrobial resistance</article-title>. <source>Infect. Control Hosp. Epidemiol.</source> <volume>26</volume>, <fpage>346</fpage>&#x2013;<lpage>351</lpage>. doi: <pub-id pub-id-type="doi">10.1086/502550</pub-id>, PMID: <pub-id pub-id-type="pmid">15865269</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kluger</surname> <given-names>Y.</given-names></name> <name><surname>Basri</surname> <given-names>R.</given-names></name> <name><surname>Chang</surname> <given-names>J. T.</given-names></name> <name><surname>Gerstein</surname> <given-names>M.</given-names></name></person-group> (<year>2003</year>). <article-title>Spectral biclustering of microarray data: coclustering genes and conditions</article-title>. <source>Genome Res.</source> <volume>13</volume>, <fpage>703</fpage>&#x2013;<lpage>716</lpage>. doi: <pub-id pub-id-type="doi">10.1101/gr.648603</pub-id>, PMID: <pub-id pub-id-type="pmid">12671006</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kola</surname> <given-names>I.</given-names></name> <name><surname>Landis</surname> <given-names>J.</given-names></name></person-group> (<year>2004</year>). <article-title>Can the pharmaceutical industry reduce attrition rates?</article-title> <source>Nat. Rev. Drug Discov.</source> <volume>3</volume>, <fpage>711</fpage>&#x2013;<lpage>716</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nrd1470</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>LeCun</surname> <given-names>Y.</given-names></name> <name><surname>Bengio</surname> <given-names>Y.</given-names></name> <name><surname>Hinton</surname> <given-names>G.</given-names></name></person-group> (<year>2015</year>). <article-title>Deep learning</article-title>. <source>Nature</source> <volume>521</volume>, <fpage>436</fpage>&#x2013;<lpage>444</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nature14539</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>J.</given-names></name> <name><surname>Yoon</surname> <given-names>W.</given-names></name> <name><surname>Kim</surname> <given-names>S.</given-names></name> <name><surname>Kim</surname> <given-names>D.</given-names></name> <name><surname>Kim</surname> <given-names>S.</given-names></name> <name><surname>So</surname> <given-names>C. H.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Bio BERT: a pre-trained biomedical language representation model for biomedical text mining</article-title>. <source>Bioinformatics</source> <volume>36</volume>, <fpage>1234</fpage>&#x2013;<lpage>1240</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lipton</surname> <given-names>Z. C.</given-names></name></person-group> (<year>2017</year>). <article-title>The mythos of model interpretability</article-title>. <source>Comput. Sci.</source> <volume>2017</volume>:<fpage>3490</fpage>. doi: <pub-id pub-id-type="doi">10.48550/arXiv.1606.03490</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>X.</given-names></name> <name><surname>Zheng</surname> <given-names>Y.</given-names></name> <name><surname>Du</surname> <given-names>Z.</given-names></name> <name><surname>Ding</surname> <given-names>M.</given-names></name> <name><surname>Qian</surname> <given-names>Y.</given-names></name> <name><surname>Yang</surname> <given-names>Z.</given-names></name> <etal/></person-group>. (<year>2023</year>). <italic>GPT understands, too</italic>. AI Open. Available at: <ext-link xlink:href="https://www.sciencedirect.com/science/article/pii/S2666651023000141" ext-link-type="uri">https://www.sciencedirect.com/science/article/pii/S2666651023000141</ext-link>.</citation></ref>
<ref id="ref24"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Lundberg</surname> <given-names>S. M.</given-names></name> <name><surname>Lee</surname> <given-names>S. I.</given-names></name></person-group> (<year>2017</year>). <article-title>A unified approach to interpreting model predictions</article-title>. In: Proceedings of the 31st international conference on neural information processing systems. Red hook, NY, USA: Curran associates Inc., pp. 4768&#x2013;4777.</citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lysenko</surname> <given-names>A.</given-names></name> <name><surname>Sharma</surname> <given-names>A.</given-names></name> <name><surname>Boroevich</surname> <given-names>K. A.</given-names></name> <name><surname>Tsunoda</surname> <given-names>T.</given-names></name></person-group> (<year>2018</year>). <article-title>An integrative machine learning approach for prediction of toxicity-related drug safety</article-title>. <source>Life Sci. Alliance</source> <volume>1</volume>:<fpage>e201800098</fpage>. doi: <pub-id pub-id-type="doi">10.26508/lsa.201800098</pub-id>, PMID: <pub-id pub-id-type="pmid">30515477</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Manor</surname> <given-names>B.</given-names></name> <name><surname>Lipsitz</surname> <given-names>L. A.</given-names></name></person-group> (<year>2013</year>). <article-title>Physiologic complexity and aging: implications for physical function and rehabilitation</article-title>. <source>Prog. Neuro-Psychopharmacol. Biol. Psychiatry</source> <volume>45</volume>, <fpage>287</fpage>&#x2013;<lpage>293</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.pnpbp.2012.08.020</pub-id>, PMID: <pub-id pub-id-type="pmid">22985940</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McFarland</surname> <given-names>L. V.</given-names></name> <name><surname>Surawicz</surname> <given-names>C. M.</given-names></name> <name><surname>Rubin</surname> <given-names>M.</given-names></name> <name><surname>Fekety</surname> <given-names>R.</given-names></name> <name><surname>Elmer</surname> <given-names>G. W.</given-names></name> <name><surname>Greenberg</surname> <given-names>R. N.</given-names></name></person-group> (<year>1999</year>). <article-title>Recurrent <italic>Clostridium difficile</italic> disease: epidemiology and Clinical characteristics</article-title>. <source>Infect. Control Hosp. Epidemiol.</source> <volume>20</volume>, <fpage>43</fpage>&#x2013;<lpage>50</lpage>. doi: <pub-id pub-id-type="doi">10.1086/501553</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Paul</surname> <given-names>S. M.</given-names></name> <name><surname>Mytelka</surname> <given-names>D. S.</given-names></name> <name><surname>Dunwiddie</surname> <given-names>C. T.</given-names></name> <name><surname>Persinger</surname> <given-names>C. C.</given-names></name> <name><surname>Munos</surname> <given-names>B. H.</given-names></name> <name><surname>Lindborg</surname> <given-names>S. R.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>How to improve R &#x0026; D productivity: the pharmaceutical industry&#x2019;s grand challenge</article-title>. <source>Nat. Rev. Drug Discov.</source> <volume>9</volume>, <fpage>203</fpage>&#x2013;<lpage>214</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nrd3078</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pedregosa</surname> <given-names>F.</given-names></name> <name><surname>Varoquaux</surname> <given-names>G.</given-names></name> <name><surname>Gramfort</surname> <given-names>A.</given-names></name> <name><surname>Michel</surname> <given-names>V.</given-names></name> <name><surname>Thirion</surname> <given-names>B.</given-names></name> <name><surname>Grisel</surname> <given-names>O.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Scikit-learn: machine learning in Python</article-title>. <source>J. Mach. Learn. Res.</source> <volume>12</volume>, <fpage>2825</fpage>&#x2013;<lpage>2830</lpage>.  doi: <pub-id pub-id-type="doi">10.48550/arXiv.1201.0490</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Raschka</surname> <given-names>S.</given-names></name></person-group> (<year>2018</year>). <article-title>MLxtend: providing machine learning and data science utilities and extensions to Python&#x2019;s scientific computing stack</article-title>. <source>J. Open Source Softw.</source> <volume>3</volume>:<fpage>638</fpage>. doi: <pub-id pub-id-type="doi">10.21105/joss.00638</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Satopaa</surname> <given-names>V.</given-names></name> <name><surname>Albrecht</surname> <given-names>J.</given-names></name> <name><surname>Irwin</surname> <given-names>D.</given-names></name> <name><surname>Raghavan</surname> <given-names>B.</given-names></name></person-group> (<year>2011</year>). <italic>Finding a &#x201C;Kneedle&#x201D; in a haystack: detecting knee points in system behavior</italic>. In: 2011 31st international conference on distributed computing systems workshops, pp. 166&#x2013;171.</citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Seyhan</surname> <given-names>A. A.</given-names></name></person-group> (<year>2019</year>). <article-title>Lost in translation: the valley of death across preclinical and clinical divide &#x2013; identification of problems and overcoming obstacles</article-title>. <source>Transl. Med. Commun.</source> <volume>4</volume>, <fpage>1</fpage>&#x2013;<lpage>19</lpage>. doi: <pub-id pub-id-type="doi">10.1186/s41231-019-0050-7</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shah</surname> <given-names>P.</given-names></name> <name><surname>Kendall</surname> <given-names>F.</given-names></name> <name><surname>Khozin</surname> <given-names>S.</given-names></name> <name><surname>Goosen</surname> <given-names>R.</given-names></name> <name><surname>Hu</surname> <given-names>J.</given-names></name> <name><surname>Laramie</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Artificial intelligence and machine learning in clinical development: a translational perspective</article-title>. <source>NPJ Digit. Med.</source> <volume>2</volume>, <fpage>1</fpage>&#x2013;<lpage>5</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41746-019-0148-3</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shultz</surname> <given-names>L. D.</given-names></name> <name><surname>Ishikawa</surname> <given-names>F.</given-names></name> <name><surname>Greiner</surname> <given-names>D. L.</given-names></name></person-group> (<year>2007</year>). <article-title>Humanized mice in translational biomedical research</article-title>. <source>Nat. Rev. Immunol.</source> <volume>7</volume>, <fpage>118</fpage>&#x2013;<lpage>130</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nri2017</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smits</surname> <given-names>W. K.</given-names></name> <name><surname>Lyras</surname> <given-names>D.</given-names></name> <name><surname>Lacy</surname> <given-names>D. B.</given-names></name> <name><surname>Wilcox</surname> <given-names>M. H.</given-names></name> <name><surname>Kuijper</surname> <given-names>E. J.</given-names></name></person-group> (<year>2016</year>). <article-title><italic>Clostridium difficile</italic> infection</article-title>. <source>Nat. Rev. Dis. Prim.</source> <volume>2</volume>, <fpage>1</fpage>&#x2013;<lpage>20</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nrdp.2016.20</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>D.</given-names></name> <name><surname>Gao</surname> <given-names>W.</given-names></name> <name><surname>Hu</surname> <given-names>H.</given-names></name> <name><surname>Zhou</surname> <given-names>S.</given-names></name></person-group> (<year>2022</year>). <article-title>Why 90% of clinical drug development fails and how to improve it?</article-title> <source>Acta Pharm. Sin. B</source> <volume>12</volume>, <fpage>3049</fpage>&#x2013;<lpage>3062</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.apsb.2022.02.002</pub-id>, PMID: <pub-id pub-id-type="pmid">35865092</pub-id></citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Teasley</surname> <given-names>D.</given-names></name> <name><surname>Olson</surname> <given-names>M.</given-names></name> <name><surname>Gebhard</surname> <given-names>R.</given-names></name> <name><surname>Gerding</surname> <given-names>D.</given-names></name> <name><surname>Peterson</surname> <given-names>L.</given-names></name> <name><surname>Schwartz</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>1983</year>). <article-title>Prospective randomised trial of metronidazole versus vancomycin for Clostridium-difficile-associated diarrhoea and colitis</article-title>. <source>Lancet</source> <volume>322</volume>, <fpage>1043</fpage>&#x2013;<lpage>1046</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(83)91036-X</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Toh</surname> <given-names>T. S.</given-names></name> <name><surname>Dondelinger</surname> <given-names>F.</given-names></name> <name><surname>Wang</surname> <given-names>D.</given-names></name></person-group> (<year>2019</year>). <article-title>Looking beyond the hype: applied AI and machine learning in translational medicine</article-title>. <source>EBioMedicine</source> <volume>47</volume>, <fpage>607</fpage>&#x2013;<lpage>615</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ebiom.2019.08.027</pub-id>, PMID: <pub-id pub-id-type="pmid">31466916</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van Giau</surname> <given-names>V.</given-names></name> <name><surname>Lee</surname> <given-names>H.</given-names></name> <name><surname>An</surname> <given-names>S. S. A.</given-names></name> <name><surname>Hulme</surname> <given-names>J.</given-names></name></person-group> (<year>2019</year>). <article-title>Recent advances in the treatment of <italic>C. difficile</italic> using biotherapeutic agents</article-title>. <source>Infect. Drug Resist.</source> <volume>12</volume>, <fpage>1597</fpage>&#x2013;<lpage>1615</lpage>. doi: <pub-id pub-id-type="doi">10.2147/IDR.S207572</pub-id>, PMID: <pub-id pub-id-type="pmid">31354309</pub-id></citation></ref>
<ref id="ref40"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Vaswani</surname> <given-names>A.</given-names></name> <name><surname>Shazeer</surname> <given-names>N.</given-names></name> <name><surname>Parmar</surname> <given-names>N.</given-names></name> <name><surname>Uszkoreit</surname> <given-names>J.</given-names></name> <name><surname>Jones</surname> <given-names>L.</given-names></name> <name><surname>Gomez</surname> <given-names>A. N.</given-names></name> <etal/></person-group>. (<year>2017</year>). <italic>Attention is all you need</italic>. In: Advances in neural information processing systems. Curran associates, Inc. Available at: <ext-link xlink:href="https://proceedings.neurips.cc/paper_files/paper/2017/hash/3f5ee243547dee91fbd053c1c4a845aa-Abstract.html" ext-link-type="uri">https://proceedings.neurips.cc/paper_files/paper/2017/hash/3f5ee243547dee91fbd053c1c4a845aa-Abstract.html</ext-link>.</citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ventz</surname> <given-names>S.</given-names></name> <name><surname>Cellamare</surname> <given-names>M.</given-names></name> <name><surname>Parmigiani</surname> <given-names>G.</given-names></name> <name><surname>Trippa</surname> <given-names>L.</given-names></name></person-group> (<year>2018</year>). <article-title>Adding experimental arms to platform clinical trials: randomization procedures and interim analyses</article-title>. <source>Biostatistics</source> <volume>19</volume>, <fpage>199</fpage>&#x2013;<lpage>215</lpage>. doi: <pub-id pub-id-type="doi">10.1093/biostatistics/kxx030</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>W.</given-names></name> <name><surname>Kiik</surname> <given-names>M.</given-names></name> <name><surname>Peek</surname> <given-names>N.</given-names></name> <name><surname>Curcin</surname> <given-names>V.</given-names></name> <name><surname>Marshall</surname> <given-names>I. J.</given-names></name> <name><surname>Rudd</surname> <given-names>A. G.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>A systematic review of machine learning models for predicting outcomes of stroke with structured data</article-title>. <source>PLoS One</source> <volume>15</volume>:<fpage>e0234722</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0234722</pub-id>, PMID: <pub-id pub-id-type="pmid">32530947</pub-id></citation></ref>
<ref id="ref43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>D.</given-names></name></person-group> (<year>2011</year>). <article-title>Translational research: current status, challenges and future strategies</article-title>. <source>Am. J. Transl. Res.</source> <volume>3</volume>, <fpage>422</fpage>&#x2013;<lpage>433</lpage>, PMID: <pub-id pub-id-type="pmid">22046484</pub-id></citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zar</surname> <given-names>F. A.</given-names></name> <name><surname>Bakkanagari</surname> <given-names>S. R.</given-names></name> <name><surname>Moorthi</surname> <given-names>K.</given-names></name> <name><surname>Davis</surname> <given-names>M. B.</given-names></name></person-group> (<year>2007</year>). <article-title>A comparison of vancomycin and metronidazole for the treatment of <italic>Clostridium difficile</italic>-associated diarrhea, stratified by disease severity</article-title>. <source>Clin. Infect. Dis.</source> <volume>45</volume>, <fpage>302</fpage>&#x2013;<lpage>307</lpage>. doi: <pub-id pub-id-type="doi">10.1086/519265</pub-id>, PMID: <pub-id pub-id-type="pmid">17599306</pub-id></citation></ref>
<ref id="ref45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhuang</surname> <given-names>S. H.</given-names></name> <name><surname>Xiu</surname> <given-names>L.</given-names></name> <name><surname>Elsayed</surname> <given-names>Y. A.</given-names></name></person-group> (<year>2009</year>). <article-title>Overall survival: a gold standard in search of a surrogate: the value of progression-free survival and time to progression as end points of drug efficacy</article-title>. <source>Cancer J.</source> <volume>15</volume>, <fpage>395</fpage>&#x2013;<lpage>400</lpage>. doi: <pub-id pub-id-type="doi">10.1097/PPO.0b013e3181be231d</pub-id>, PMID: <pub-id pub-id-type="pmid">19826359</pub-id></citation></ref>
</ref-list>
</back>
</article>