<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Chem.</journal-id>
<journal-title>Frontiers in Chemistry</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Chem.</abbrev-journal-title>
<issn pub-type="epub">2296-2646</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1503593</article-id>
<article-id pub-id-type="doi">10.3389/fchem.2024.1503593</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Chemistry</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Machine learning and molecular dynamics simulations predict potential TGR5 agonists for type 2 diabetes treatment</article-title>
<alt-title alt-title-type="left-running-head">Enejoh et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fchem.2024.1503593">10.3389/fchem.2024.1503593</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Enejoh</surname>
<given-names>Ojochenemi A.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2385636/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Okonkwo</surname>
<given-names>Chinelo H.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2483533/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Nortey</surname>
<given-names>Hector</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2932817/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kemiki</surname>
<given-names>Olalekan A.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Moses</surname>
<given-names>Ainembabazi</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2856731/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mbaoji</surname>
<given-names>Florence N.</given-names>
</name>
<xref ref-type="aff" rid="aff7">
<sup>7</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yusuf</surname>
<given-names>Abdulrazak S.</given-names>
</name>
<xref ref-type="aff" rid="aff8">
<sup>8</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2866379/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Awe</surname>
<given-names>Olaitan I.</given-names>
</name>
<xref ref-type="aff" rid="aff9">
<sup>9</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1929418/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Genetics, Genomics and Bioinformatics Department</institution>, <institution>National Biotechnology Research and Development Agency</institution>, <addr-line>Abuja</addr-line>, <country>Nigeria</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Pharmacy</institution>, <institution>National Hospital Abuja</institution>, <addr-line>Abuja</addr-line>, <country>Nigeria</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Clinical Pathology</institution>, <institution>Noguchi Memorial Institute for Medical Research</institution>, <institution>College of Health Science</institution>, <institution>University of Ghana</institution>, <addr-line>Accra</addr-line>, <country>Ghana</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Molecular and Tissue Culture Laboratory</institution>, <institution>Babcock University</institution>, <addr-line>Ilisan-remo</addr-line>, <addr-line>Ogun State</addr-line>, <country>Nigeria</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>African Centers of Excellence in Bioinformatics and data intensive sciences</institution>, <institution>Department of Immunology and Microbiology</institution>, <institution>Makerere University</institution>, <addr-line>Makerere</addr-line>, <country>Uganda</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>Infectious Disease Institute (IDI)</institution>, <institution>Makerere University</institution>, <addr-line>Kampala</addr-line>, <country>Uganda</country>
</aff>
<aff id="aff7">
<sup>7</sup>
<institution>Department of Pharmacology and Toxicology</institution>, <institution>Faculty of Pharmaceutical Sciences</institution>, <institution>University of Nigeria</institution>, <addr-line>Nsukka</addr-line>, <addr-line>Enugu</addr-line>, <country>Nigeria</country>
</aff>
<aff id="aff8">
<sup>8</sup>
<institution>Department of Biochemistry</institution>, <institution>Faculty of Basic Health Science</institution>, <institution>Bayero University</institution>, <addr-line>Kano</addr-line>, <country>Nigeria</country>
</aff>
<aff id="aff9">
<sup>9</sup>
<institution>African Society for Bioinformatics and Computational Biology</institution>, <addr-line>Cape Town</addr-line>, <country>South Africa</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/653205/overview">Marko Jukic</ext-link>, University of Maribor, Slovenia</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1744367/overview">Titilayo Omolara Johnson</ext-link>, University of Jos, Nigeria</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2858706/overview">Jessica Elena Mendieta Wejebe</ext-link>, Instituto Polit&#xe9;cnico Nacional, Mexico</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Ojochenemi A. Enejoh, <email>chenemidala@gmail.com</email>; Olaitan I. Awe, <email>laitanawe@gmail.com</email>
</corresp>
<fn fn-type="other" id="fn1">
<label>
<sup>&#x2020;</sup>
</label>
<p>ORCID: Ojochenemi A. Enejoh, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0000-0002-5684-2472">orcid.org/0000-0002-5684-2472</ext-link>; Chinelo H. Okonkwo, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0000-0001-5421-8054">orcid.org/0000-0001-5421-8054</ext-link>; Florence N. Mbaoji, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0000-0002-9705-3250">orcid.org/0000-0002-9705-3250</ext-link>; Abdulrazak S. Yusuf, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0000-0002-7649-4022">orcid.org/0000-0002-7649-4022</ext-link>; Olaitan I. Awe, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0000-0002-4257-3611">orcid.org/0000-0002-4257-3611</ext-link>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>09</day>
<month>01</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>12</volume>
<elocation-id>1503593</elocation-id>
<history>
<date date-type="received">
<day>29</day>
<month>09</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>13</day>
<month>12</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Enejoh, Okonkwo, Nortey, Kemiki, Moses, Mbaoji, Yusuf and Awe.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Enejoh, Okonkwo, Nortey, Kemiki, Moses, Mbaoji, Yusuf and Awe</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Treatment of type 2 diabetes (T2D) remains a significant challenge because of its multifactorial nature and complex metabolic pathways. There is growing interest in finding new therapeutic targets that could lead to safer and more effective treatment options. Takeda G protein-coupled receptor 5 (TGR5) is a promising antidiabetic target that plays a key role in metabolic regulation, especially in glucose homeostasis and energy expenditure. TGR5 agonists are attractive candidates for T2D therapy because of their ability to improve glycemic control. This study used machine learning-based models (ML), molecular docking (MD), and molecular dynamics simulations (MDS) to explore novel small molecules as potential TGR5 agonists.</p>
</sec>
<sec>
<title>Methods</title>
<p>Bioactivity data for known TGR5 agonists were obtained from the ChEMBL database. The dataset was cleaned and molecular descriptors based on Lipinski&#x2019;s rule of five were selected as input features for the ML model, which was built using the Random Forest algorithm. The optimized ML model was used to screen the COCONUT database and predict potential TGR5 agonists based on their molecular features. 6,656 compounds predicted from the COCONUT database were docked within the active site of TGR5 to calculate their binding energies. The four top-scoring compounds with the lowest binding energies were selected and their activities were compared to those of the co-crystallized ligand. A 100&#xa0;ns MDS was used to assess the binding stability of the compounds to TGR5.</p>
</sec>
<sec>
<title>Results</title>
<p>Molecular docking results showed that the lead compounds had a stronger affinity for TGR5 than the co-crystallized ligand. MDS revealed that the lead compounds were stable within the TGR5 binding pocket.</p>
</sec>
<sec>
<title>Discussion</title>
<p>The combination of ML, MD, and MDS provides a powerful approach for predicting new TGR5 agonists that can be optimised for T2D treatment.</p>
</sec>
</abstract>
<kwd-group>
<kwd>TGR5</kwd>
<kwd>type 2 diabetes</kwd>
<kwd>machine learning</kwd>
<kwd>molecular docking</kwd>
<kwd>molecular dynamics simulation</kwd>
<kwd>COCONUT database</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Medicinal and Pharmaceutical Chemistry</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Type 2 diabetes (T2D) is an escalating metabolic disorder of global health concern (<xref ref-type="bibr" rid="B38">Ong et al., 2023</xref>). This disease is characterised by persistent hyperglycaemia due to insulin resistance and an eventual decline in pancreatic &#x3b2;-cell function (<xref ref-type="bibr" rid="B8">Bhatti et al., 2022</xref>; <xref ref-type="bibr" rid="B19">Deol and Bashir, 2024</xref>). In 2017, approximately 462&#xa0;million people worldwide were affected by T2D (<xref ref-type="bibr" rid="B1">Abdul Basith Khan et al., 2020</xref>). Individuals with T2D are susceptible to long-term complications, including cardiovascular disease, neuropathy, retinopathy, and kidney failure, which lead to significant morbidity and mortality (<xref ref-type="bibr" rid="B18">DeFronzo et al., 2015</xref>; <xref ref-type="bibr" rid="B14">Chatterjee et al., 2017</xref>; <xref ref-type="bibr" rid="B47">Sharma et al., 2024</xref>). Although genetic factors have been correlated with the pathogenesis of the disease, environmental factors (consumption of an unhealthy diet, reduced physical activity, and obesity) enhance pathophysiological anomalies associated with defective glucose homeostasis (<xref ref-type="bibr" rid="B2">Abolo et al., 2024</xref>; <xref ref-type="bibr" rid="B28">Mansour et al., 2023</xref>; <xref ref-type="bibr" rid="B25">Ikwuka et al., 2023</xref>).</p>
<p>Takeda G protein-coupled receptor 5 (TGR5) is a member of the class A G protein-coupled receptor (GPCR) family (<xref ref-type="bibr" rid="B53">Thomas et al., 2008</xref>; <xref ref-type="bibr" rid="B24">Guo et al., 2016</xref>). TGR5 has emerged as a promising target in the context of T2D owing to its involvement in glucose homeostasis, energy expenditure, and anti-inflammatory pathways (<xref ref-type="bibr" rid="B45">Sato et al., 2007</xref>; <xref ref-type="bibr" rid="B10">Bhimanwar and Mittal, 2021</xref>). TGR5 is activated by bile acids and plays a crucial role in regulating metabolic processes in various tissues, including the liver, pancreas, and adipose tissue (<xref ref-type="bibr" rid="B27">Lun et al., 2023</xref>).</p>
<p>Despite its potential, development of a TGR5 agonist as a therapeutic agent has faced several challenges. Identifying selective and potent TGR5 agonists is complicated by the structural flexibility of the receptor and the need for compounds that can cross biological membranes and exhibit favourable pharmacokinetic properties. Moreover, many identified TGR5 agonists have off-target effects or are associated with safety concerns, particularly regarding their impact on the gastrointestinal system.</p>
<p>Recent studies have shown the use of multi-omics and transcriptomic data integration approaches to predict potential biomarkers for diseases (<xref ref-type="bibr" rid="B4">Alaya et al., 2024</xref>; <xref ref-type="bibr" rid="B6">Ben Aribi et al., 2024</xref>; <xref ref-type="bibr" rid="B15">Chikwambi et al., 2023</xref>; <xref ref-type="bibr" rid="B21">El Abed et al., 2023</xref>; <xref ref-type="bibr" rid="B33">Nzungize et al., 2022</xref>; <xref ref-type="bibr" rid="B55">Wesonga and Awe, 2022</xref>), as well as to understand disease susceptibility (<xref ref-type="bibr" rid="B32">Nyamari et al., 2023</xref>). Other studies have also provided intriguing insights into viral evolution, diversity, and variation using computational approaches (<xref ref-type="bibr" rid="B5">Awe et al., 2023</xref>; <xref ref-type="bibr" rid="B31">Mwanga et al., 2023</xref>; <xref ref-type="bibr" rid="B34">Obura et al., 2022</xref>; <xref ref-type="bibr" rid="B37">Oluwagbemi and Awe, 2018</xref>).</p>
<p>In the field of drug discovery, machine learning (ML), molecular docking (MD), and molecular dynamics simulations (MDS) have revolutionized the identification and optimization of novel drug candidates (<xref ref-type="bibr" rid="B20">Di Stefano et al., 2022</xref>; <xref ref-type="bibr" rid="B43">Sadybekov and Katritch, 2023</xref>). ML models can rapidly analyze vast chemical libraries and predict the bioactivity of compounds with high accuracy, thereby significantly reducing the time and cost associated with traditional drug discovery methods (<xref ref-type="bibr" rid="B20">Di Stefano et al., 2022</xref>; <xref ref-type="bibr" rid="B9">Bhimanwar et al., 2023</xref>). Molecular docking studies provide insight into the interactions between small molecules and their target receptors, enabling the identification of key binding interactions that contribute to receptor activation or inhibition (<xref ref-type="bibr" rid="B30">Mursal et al., 2024</xref>). MDS further refines these predictions by accounting for the dynamic nature of protein-ligand interactions, providing a more realistic assessment of a compound&#x2019;s stability and efficacy (<xref ref-type="bibr" rid="B35">Ogbodo et al., 2023</xref>; <xref ref-type="bibr" rid="B11">Brueckner et al., 2024</xref>).</p>
<p>Recent advancements in machine learning have led to the development of sophisticated algorithms capable of learning complex patterns in chemical data, enabling the prediction of bioactive compounds from diverse chemical spaces (<xref ref-type="bibr" rid="B54">van Heerden et al., 2023</xref>). In the context of TGR5 agonist discovery, several studies have applied ML techniques to screen compound libraries and predict potential agonists (<xref ref-type="bibr" rid="B41">Qin et al., 2023</xref>). Furthermore, molecular docking has been used to explore the binding interactions of the predicted agonists with TGR5 (<xref ref-type="bibr" rid="B50">Sindhu and Srinivasan, 2015</xref>). This study aims to contribute to the growing field of TGR5-targeted therapies by providing a systematic and validated approach for the discovery of potential TGR5 agonists.</p>
</sec>
<sec sec-type="methods" id="s2">
<title>2 Methods</title>
<sec id="s2-1">
<title>2.1 Machine learning</title>
<p>The workflow pipeline used in this study is summarised in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>The workflow pipeline used in this study. It is divided into three parts: Machine learning, molecular docking, and molecular dynamics simulation.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g001.tif"/>
</fig>
<sec id="s2-1-1">
<title>2.1.1 Data collection and preprocessing</title>
<p>Bioactivity data of compounds with biological activity for TGR5 (CHEMBL5409), expressed as EC<sub>50</sub> values in nM (nanomolar), were downloaded from the ChEMBL database (<ext-link ext-link-type="uri" xlink:href="https://www.ebi.ac.uk/chembl/">https://www.ebi.ac.uk/chembl/</ext-link>) (<xref ref-type="bibr" rid="B7">Bento et al., 2014</xref>; <xref ref-type="bibr" rid="B23">Gaulton et al., 2017</xref>). ChEMBL is a comprehensive, curated bioactivity database containing information on molecule-target interactions extracted from published literature. The data were cleaned, which involved removing any compounds with missing EC<sub>50</sub> values, those without SMILES notation, and redundant bioactivity values. For the data preprocessing step, compounds were classified as active if their EC<sub>50</sub> values were less than 1,000&#xa0;nM, and inactive if they were more than 10,000&#xa0;nM. Values between 1,000 and 10,000&#xa0;nM were considered intermediate. The intermediate category was removed, leading to an exploratory data analysis that focused only on active and inactive compounds.</p>
</sec>
<sec id="s2-1-2">
<title>2.1.2 Exploratory data analysis</title>
<p>The dataset includes chemical names and corresponding SMILES notations, which provide information about the molecular structure used to calculate the molecular descriptors. The drug-likeness of the compounds was assessed based on the pharmacokinetic parameters of absorption, distribution, metabolism, and excretion (ADME). Lipinski&#x2019;s Rule of Five (Ro5), which states that a compound should have a molecular weight of less than 500&#xa0;Da, an octanol-water partition coefficient (LogP) of less than 5, no more than 5 hydrogen bond donors, and no more than 10 hydrogen bond acceptors, was used to compute the molecular descriptors (<xref ref-type="bibr" rid="B26">Lipinski et al., 2012</xref>). Ro5 provides insight into a compound&#x2019;s potential for absorption in the body, distribution to the appropriate target tissue or organ, metabolism, and eventual excretion from the body. To ensure a more uniform distribution of EC<sub>50</sub> data, EC<sub>50</sub> values were converted to a negative logarithmic scale (i.e., &#x2212;log<sub>10</sub>), resulting in the pEC<sub>50</sub> metric.</p>
</sec>
<sec id="s2-1-3">
<title>2.1.3 Model building, training, and deployment</title>
<p>Selected molecular descriptors were used as input features to build the model. The model was built using the Random Forest algorithm to distinguish between agonists and nonagonists. Fingerprint descriptors were generated using PaDEL (<xref ref-type="bibr" rid="B57">Yap, 2011</xref>), and data matrices were prepared accordingly. Features with low variance were removed, and the dataset was then divided in an 80:20 ratio for training purposes. To prevent potential bias arising from a single data split in constructing predictive models, the models were developed using 100 independent data splits (<xref ref-type="bibr" rid="B40">Puzyn et al., 2011</xref>). The optimised ML model was deployed in the form of an offline application using Streamlit to screen the COCONUT (COlleCtion of Open Natural prodUcTs) database (<ext-link ext-link-type="uri" xlink:href="https://coconut.naturalproducts.net/">https://coconut.naturalproducts.net</ext-link>), predicting potential TGR5 agonists based on their molecular features (<xref ref-type="bibr" rid="B51">Sorokina et al., 2021</xref>). More than four hundred thousand natural compounds that have been sourced from open and free sources are stored in the COCONUT database (<xref ref-type="bibr" rid="B13">Capecchi and Reymond, 2021</xref>).</p>
</sec>
</sec>
<sec id="s2-2">
<title>2.2 Molecular docking</title>
<sec id="s2-2-1">
<title>2.2.1 Ligand and receptor preparation</title>
<sec id="s2-2-1-1">
<title>2.2.1.1 Ligand Preparation</title>
<p>The SMILES of these compounds were obtained and converted to the 2D format using Datawarrior and prepared using the LigPrep module in Schr&#xf6;dinger. This tool was employed to generate the most probable protonation states at physiological pH (7.0 &#xb1; 2.0), ensure the correct stereochemistry, and minimise the energy of the ligand structures using the OPLS4 force field.</p>
</sec>
<sec id="s2-2-1-2">
<title>2.2.1.2 Protein preparation</title>
<p>The crystal structure of the TGR5 receptor (PDB ID: 7CFN) (<xref ref-type="bibr" rid="B56">Yang et al., 2020</xref>) was downloaded from the Protein Data Bank (PDB) and imported into Maestro (<xref ref-type="bibr" rid="B46">Schrodinger, 2021</xref>). The Protein Preparation Wizard was used to prepare the downloaded protein, which involved removing water molecules beyond 5&#xa0;&#xc5; from the binding site, adding missing hydrogen atoms, assigning proper bond orders, adjusting protonation states of ionisable residues, and minimising the receptor using the OPLS4 force field to relieve steric clashes and optimise geometry. A grid box was generated around the active site where the ligands were docked.</p>
</sec>
</sec>
<sec id="s2-2-2">
<title>2.2.2 Molecular docking</title>
<p>The prepared ligands were docked into the active site of TGR5 using the Glide tool in Schr&#xf6;dinger (<xref ref-type="bibr" rid="B46">Schrodinger, 2021</xref>). SP (standard precision) and XP (extra-precision) protocols were applied. The results were analysed by examining their binding energies to TGR5. A total of 295 compounds had lower binding energies compared to the co-crystallised ligand. The top 4 ligands with the lowest docking scores were selected for subsequent molecular dynamics simulations.</p>
</sec>
<sec id="s2-2-3">
<title>2.2.3 Validation of docking protocol</title>
<p>The docking protocol was validated by re-docking the co-crystallised ligand into the active site of the TGR5 protein and calculating the RMSD of the two poses (<xref ref-type="bibr" rid="B48">Shivanika et al., 2020</xref>).</p>
</sec>
</sec>
<sec id="s2-3">
<title>2.3 Molecular dynamics simulation</title>
<sec id="s2-3-1">
<title>2.3.1 System setup</title>
<p>The simulation system was prepared using the Desmond System Setup tool. The TGR5-ligand complexes obtained from docking studies were embedded in a POPC (300&#xa0;K) membrane bilayer. Appropriate ions were added to neutralise the system. Energy minimisation was performed to remove any steric clashes, followed by equilibration to stabilise the temperature and pressure of the system.</p>
<p>The protein-ligand complex was solvated in an orthorhombic simulation box filled with explicit TIP3P water molecules. The buffer distance between the complex and edge of the simulation box was set to 10&#xa0;&#xc5; to avoid boundary effects, and 0.15&#xa0;M NaCl was added to neutralise the system and mimic physiological conditions. The OPLS4 force field was applied to describe the interactions between atoms in the system, including the protein, ligand, and solvent molecules. Before carrying out MD simulation, energy minimisation was performed to remove any steric clashes or bad contacts introduced during the system setup.</p>
</sec>
<sec id="s2-3-2">
<title>2.3.2 Simulation run</title>
<p>The simulations were conducted under a constant number of particles, pressure (1&#xa0;atm), and temperature (300&#xa0;K) using the Desmond module of the Schr&#xf6;dinger software. The model system was relaxed before simulation and equilibrated, after which a 100&#xa0;ns production run was carried out, with coordinates recorded every 100&#xa0;ps for subsequent analysis. The simulation trajectory was monitored to ensure system stability throughout the run. MDS was carried out on a GPU-enabled Linux operating system.</p>
</sec>
<sec id="s2-3-3">
<title>2.3.3 Post-simulation trajectory analysis</title>
<p>The trajectory was analysed to assess the binding stability, interaction energy, and conformational dynamics of the TGR5-ligand complexes. This analysis helps to identify the most promising TGR5 agonist for further experimental validation. The simulation trajectories were analysed using the simulation interaction diagram tool in Schr&#xf6;dinger. Key metrics included:<list list-type="simple">
<list-item>
<p>- Root Mean Square Deviation (RMSD): To evaluate the stability of the protein-ligand complex.</p>
</list-item>
<list-item>
<p>- Root Mean Square Fluctuation (RMSF): To analyse the flexibility of individual residues in the receptor.</p>
</list-item>
<list-item>
<p>- Radius of gyration (RoG): To measure the extendedness of a ligand; it is equivalent to its principal moment of inertia.</p>
</list-item>
<list-item>
<p>- Intramolecular hydrogen bonds (intraHB): To count the number of internal hydrogen bonds within a ligand molecule.</p>
</list-item>
<list-item>
<p>- Ligand-Protein interactions: To monitor the types of interactions (e.g., hydrogen bonds, hydrophobic contacts) between the ligand and receptor throughout the simulation.</p>
</list-item>
</list>
</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Chemical space analysis of TGR5 activators</title>
<p>A total of 518 active, 187 inactive, and 190 intermediate compounds were identified after the data preparation step (<xref ref-type="fig" rid="F2">Figure 2A</xref>). The two bioactivity classes span similar chemical spaces, as shown by the scatter plot of MW vs. LogP (<xref ref-type="fig" rid="F2">Figure 2B</xref>). Considering the pEC<sub>50</sub> values (<xref ref-type="fig" rid="F2">Figure 2C</xref>), the actives and inactives displayed statistically significant differences, which was to be expected since threshold values (EC<sub>50</sub> &#x3c; 1,000&#xa0;nM &#x3d; Actives and EC<sub>50</sub> &#x3e; 10,000&#xa0;nM &#x3d; Inactives, corresponding to pEC<sub>50</sub> &#x3e; 6 &#x3d; Actives and pEC<sub>50</sub> &#x3c; 5 &#x3d; Inactives) were used to define actives and inactives.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>
<bold>(A)</bold> Frequency plot of the two bioactivity classes, <bold>(B)</bold> scatter plot of MW versus LogP, and <bold>(C)</bold> box plot showing the distribution of pEC<sub>50</sub> values of the two bioactivity classes.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g002.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>3.2 Lipinski&#x2019;s descriptors</title>
<p>
<xref ref-type="fig" rid="F3">Figure 3</xref> displays the box plots of Lipinski&#x2019;s descriptors. Of the four Lipinski descriptors (MW, LogP, NumHDonors, and NumHAcceptors), only LogP exhibited no difference between the actives and inactives, while the other three descriptors (MW, NumHDonors, and NumHAcceptors) showed statistically significant differences between the active and inactive groups (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Box plots of TGR5 agonists using Lipinski&#x2019;s descriptors: LogP, molecular weight (MW), number of hydrogen acceptors (NumHAcceptors), and number of hydrogen donors (NumHDonors).</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g003.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Statistical analysis &#x7c; Mann-Whitney U test.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left"/>
<th align="left">Descriptor</th>
<th align="left">Statistics</th>
<th align="left">P value</th>
<th align="left">Alpha</th>
<th align="left">Interpretation</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">1</td>
<td align="left">pEC<sub>50</sub>
</td>
<td align="left">100,170.0</td>
<td align="left">7.281833e-93</td>
<td align="left">0.05</td>
<td align="left">Different distribution (reject H0)</td>
</tr>
<tr>
<td align="left">2</td>
<td align="left">Molecular weight</td>
<td align="left">44,041.0</td>
<td align="left">0.013695</td>
<td align="left">0.05</td>
<td align="left">Different distribution (reject H0)</td>
</tr>
<tr>
<td align="left">3</td>
<td align="left">LogP</td>
<td align="left">40,977.0</td>
<td align="left">0.000203</td>
<td align="left">0.05</td>
<td align="left">Different distribution (reject H0)</td>
</tr>
<tr>
<td align="left">4</td>
<td align="left">NumHDonors</td>
<td align="left">40,126.5</td>
<td align="left">0.000017</td>
<td align="left">0.05</td>
<td align="left">Different distribution (reject H0)</td>
</tr>
<tr>
<td align="left">5</td>
<td align="left">NumHAcceptors</td>
<td align="left">56,090.5</td>
<td align="left">0.012607</td>
<td align="left">0.05</td>
<td align="left">Different distribution (reject H0)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-3">
<title>3.3 Machine learning model to predict TGR5 agonists</title>
<p>
<xref ref-type="fig" rid="F4">Figure 4A</xref> shows the resulting scatterplot of the regression model built using the random forest algorithm. The regression model score (r<sup>2</sup>) is given as 0.40. <xref ref-type="fig" rid="F4">Figure 4B</xref> shows the predicted pEC<sub>50</sub> values of the training data. The mean squared error (MSE) and coefficient of determination (R<sup>2</sup>) for model performance are 0.34 and 0.80, respectively. <xref ref-type="fig" rid="F5">Figure 5</xref> shows a visual representation of the model performance. This shows that the model had a high r<sup>2</sup> and low root-mean-square error value.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Scatter plots of <bold>(A)</bold> regression model using random forest algorithm <bold>(B)</bold>: experimental vs. predicted pEC<sub>50</sub> for training data.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Comparison of the performance of machine learning algorithms against R-squared <bold>(A)</bold>, RMSE <bold>(B)</bold>, and time taken <bold>(C)</bold>, respectively.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g005.tif"/>
</fig>
<p>ML-based prediction identified 340,364 compounds with potential activity towards TGR5, with predicted pEC<sub>50</sub> values ranging from 4.0 to 6.9. Only compounds with predicted pEC<sub>50</sub> values between 4.0 and 4.9 were selected for docking, yielding 6,656 compounds in total. The bioactivity predictions of just the four top-scoring compounds selected in this study are displayed in <xref ref-type="table" rid="T2">Table 2</xref>.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Predicted pEC<sub>50</sub> values of the four top-scoring compounds from the screening of the COCONUT database.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">COCONUT ID</th>
<th align="center">Predicted pEC<sub>50</sub>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">CNP0209363</td>
<td align="center">4.99</td>
</tr>
<tr>
<td align="center">CNP0424850</td>
<td align="center">4.97</td>
</tr>
<tr>
<td align="center">CNP0417335</td>
<td align="center">4.91</td>
</tr>
<tr>
<td align="center">CNP0224616</td>
<td align="center">4.90</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-4">
<title>3.4 Molecular docking reveals the binding energy of lead compounds</title>
<p>
<xref ref-type="fig" rid="F6">Figure 6</xref> shows the 3D structure of TGR5 protein downloaded from the Protein Data Bank (PDB ID: 7CFN) in complex with its co-crystallized ligand. After re-docking the co-crystallized ligand into the TGR5 active site, the calculated RMSD value between the native and re-docked poses was 1.42&#xa0;&#xc5; (<xref ref-type="fig" rid="F7">Figure 7A</xref>). <xref ref-type="fig" rid="F7">Figure 7B</xref> shows the docking scores of the four top-scoring compounds (also referred to as lead compounds), represented by their COCONUT IDs, CNP0209363, CNP0424850, CNP0417335, CNP0224616, and the co-crystallized ligand, given as &#x2212;15.39, &#x2212;14.87, &#x2212;14.17, &#x2212;14.01, and &#x2212;9.01&#xa0;kcal/mol, respectively. <xref ref-type="fig" rid="F8">Figure 8</xref> shows the 2D structure of the lead compounds. All the lead compounds contain an acetal/aminal-like group (X-CH(R)-Y, where X, Y are N, S, or O) that may be acid/base labile, releasing an aldehyde. CNP0417335 and CNP0224616 have an ester group and may undergo hydrolysis at high or low pH.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>3D structure of TGR5 protein (7CFN) in complex with its co-crystallized ligand (INT-777).</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g006.tif"/>
</fig>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>
<bold>(A)</bold> Validation of docking protocol. The co-crystallized ligand (in grey) was redocked (in orange) into the active site of the TGR5 protein and superimposed. The RMSD value between the native and re-docked pose was calculated as 1.42&#xa0;&#xc5;. <bold>(B)</bold> Bar chart showing the docked scores of the lead compounds and the co-crystallized ligand.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g007.tif"/>
</fig>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>2D structures of the lead compounds from the COCONUT database <bold>(A)</bold> CNP0209363, <bold>(B)</bold> CNP0424850, <bold>(C)</bold> CNP0417335, <bold>(D)</bold> CNP0224616.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g008.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="F9">Figure 9</xref> shows the molecular interactions of the compounds with the amino acid residues found within the TGR5 binding pocket. An overview of the interactions is provided in <xref ref-type="table" rid="T3">Table 3</xref>. We observed that all the lead compounds formed hydrogen bonding with residue Asn93 during molecular docking.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>
<bold>(A)</bold> 3D conformations of the compounds within the active site of TGR5, represented as coloured sticks: orange (INT-777), purple (CNP0209363), red (CNP0424850), green (CNP0417335) and blue (CNP0224616). <bold>(B)</bold> 2D molecular interaction diagrams of INT-777 (a), lead compounds (b. CNP0209363, c. CNP0424850, d. CNP0417335, e. CNP0224616) and TGR5. Hydrogen and hydrophobic bonds are shown. All the lead compounds show binding to residue Asn93.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g009.tif"/>
</fig>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Overview of interacting amino acid residues and bond types of the compounds and TGR5 from molecular docking studies.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Compound name</th>
<th align="center">Docking scores (kcal/mol)</th>
<th align="left">Interacting amino acid residue</th>
<th align="left">Bond type</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">INT-777</td>
<td align="center">&#x2212;9.01</td>
<td align="left">Tyr 89<break/>Tyr 240<break/>Ser 247<break/>Leu 71<break/>Tyr 89<break/>Pro 92<break/>Phe 96<break/>Leu 97<break/>Tyr 240</td>
<td align="left">Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond</td>
</tr>
<tr>
<td align="left">CNP0209363</td>
<td align="center">&#x2212;15.39</td>
<td align="left">Ser 157<break/>Ser 247<break/>Asn 93<break/>Leu 74<break/>Tyr 89<break/>Leu 71<break/>Pro 92<break/>Phe 96<break/>Leu 97<break/>Leu 166<break/>Val 170<break/>Tyr 240<break/>Leu 244<break/>Tyr 251</td>
<td align="left">Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond</td>
</tr>
<tr>
<td align="left">CNP0424850</td>
<td align="center">&#x2212;14.87</td>
<td align="left">Ala 250<break/>Ser 247<break/>Asn 93<break/>Pro 259<break/>Pro 255<break/>Val 248<break/>Leu 244<break/>Tyr 240<break/>Leu 266<break/>Leu 262<break/>Leu 263<break/>Leu 71<break/>Leu 74</td>
<td align="left">Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond</td>
</tr>
<tr>
<td align="left">CNP0417335</td>
<td align="center">&#x2212;14.14</td>
<td align="left">Asn 93<break/>Thr 243<break/>Pro 259<break/>Val 248<break/>Ala 250<break/>Tyr 251<break/>Tyr 89<break/>Pro 92<break/>Phe 96<break/>Leu 97<break/>Leu 166<break/>Tyr 240<break/>Leu 262<break/>Leu 71<break/>Leu 74<break/>Leu 266</td>
<td align="left">Hydrogen bond<break/>Hydrogen bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond</td>
</tr>
<tr>
<td align="left">CNP0224616</td>
<td align="center">&#x2212;14.01</td>
<td align="left">Ser 247<break/>Leu 74<break/>Asn 93<break/>Tyr 240<break/>Ser 157<break/>Leu 71<break/>Leu 262<break/>Leu 263<break/>Leu 266<break/>Ala 250<break/>Leu 244<break/>Leu 97<break/>Phe 96<break/>Val 170<break/>Tyr 89<break/>Tyr 240<break/>Pro 92<break/>Leu 166</td>
<td align="left">Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond<break/>Hydrophobic bond</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-5">
<title>3.5 Molecular dynamics simulation</title>
<p>The kinetics of the TGR5-compound complex was investigated using molecular dynamics simulations to assess the bond configuration stability after the binding of lead compounds within the protein cavity. Simulations were conducted over a 100&#xa0;ns period for the co-ligand (INT-777) and the four lead compounds. The thermodynamic stability of these complex systems was analysed using three key parameters: root mean square deviation (RMSD), root mean square fluctuation (RMSF), and radius of gyration (RoG), all of which were monitored throughout the molecular dynamics simulation.</p>
<p>As shown in <xref ref-type="fig" rid="F10">Figure 10</xref>, the RMSD of the TGR5 protein in its apo state demonstrated instability throughout the 100&#xa0;ns simulation but became more stable upon binding to the co-ligand. Moreover, when the TGR5 protein was bound to the lead compounds, stability was observed within the range of 1&#xa0;&#xc5; to 3&#xa0;&#xc5; after the 25&#xa0;ns mark.</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>RMSD trajectories of TGR5 in the apo state and in complex with INT-777, CNP0209363, CNP0424850, CNP0417335, and CNP0224616. Simulations were performed over a 100&#xa0;ns&#xa0;(nanosecond) duration.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g010.tif"/>
</fig>
<p>Among the lead compounds, CNP0224616 exhibited the highest stability, with an RMSD value of approximately 0.8&#xa0;&#xc5;, compared to the co-ligand (INT-777), which showed an RMSD of 0.6&#xa0;&#xc5;. CNP0209363, however, displayed lower stability, with its RMSD fluctuating between 1&#xa0;&#xc5; and 2.2&#xa0;&#xc5; throughout the 100&#xa0;ns simulation. Meanwhile, CNP0417335 and CNP0424850 stabilised after 10&#xa0;ns and 25&#xa0;ns, with respective RMSD values of about 1.8&#xa0;&#xc5; and 2.7&#xa0;&#xc5; (<xref ref-type="fig" rid="F10">Figure 10</xref>).</p>
<p>RMSF values provide insight into the magnitude of fluctuations for each residue in a protein; higher RMSF values indicate greater flexibility, and lower values suggest rigidity. <xref ref-type="fig" rid="F11">Figure 11</xref> shows that RMSF values between 2&#xa0;&#xc5; and 5&#xa0;&#xc5; were recorded during the 100&#xa0;ns simulation, and the RMSF profiles of the co-ligand (INT-777) were comparable to those of the lead compounds.</p>
<fig id="F11" position="float">
<label>FIGURE 11</label>
<caption>
<p>RMSF trajectories of TGR5 in the apo state and complex with INT-777, CNP0209363, CNP0424850, CNP0417335 and CNP0224616.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g011.tif"/>
</fig>
<p>Another parameter used to assess structural stability is the radius of gyration (RoG). <xref ref-type="fig" rid="F12">Figure 12</xref> illustrates the stability trends of the lead compounds and the co-ligand. CNP0417335 and CNP0224616 initially displayed slight fluctuations during the first 10&#xa0;ns but stabilised for the remainder of the simulation, similar to the co-ligand, which remained stable around 4.6&#xa0;&#xc5;. CNP0417335 and CNP0224616 stabilised at 4.7&#xa0;&#xc5; and 4.6&#xa0;&#xc5;, respectively. In contrast, CNP0424850 reached stability only after 50&#xa0;ns, with a value close to 5&#xa0;&#xc5;, while CNP0209363 showed little to no stability throughout the simulation.</p>
<fig id="F12" position="float">
<label>FIGURE 12</label>
<caption>
<p>Radius of gyration (RoG) of the compounds in complex with TGR5.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g012.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="F13">Figure 13</xref> shows the intramolecular hydrogen bonds within the compounds. Only the lead compounds showed intramolecular hydrogen bonding up to a magnitude of 4. INT-777 showed no intramolecular hydrogen bonding during the simulation run.</p>
<fig id="F13" position="float">
<label>FIGURE 13</label>
<caption>
<p>Intramolecular hydrogen bonds within the compounds during the simulation run. Only the lead compounds showed the presence of intramolecular hydrogen bonds.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g013.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="F14">Figure 14</xref> shows the distribution of hydrogen bonds, hydrophobic bonds, ionic bonds and water bridges formed between the compounds and TGR5 during MDS. All the compounds showed binding to TGR5 via hydrogen bonds, hydrophobic bonds, and water bridges. Only INT-777, CNP0424850 and CNP0224616 showed ionic bonding via Gln253 residue.</p>
<fig id="F14" position="float">
<label>FIGURE 14</label>
<caption>
<p>Protein-ligand contacts between TGR5 and the compounds during the simulation run. The figure shows protein interactions with the ligand. The interactions are categorized into hydrogen bonds, hydrophobic bonds, ionic bonds and water bridges. The bar charts show the amount of time a specific interaction is sustained.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g014.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="F15">Figure 15</xref> shows the ligand-protein contacts made during simulation. An overview of the interactions is provided in <xref ref-type="table" rid="T4">Table 4</xref>. All the compounds showed binding with the Ser247 residue; this interaction was also observed from molecular docking studies. Only CNP0424850 and CNP0417335 showed pi-pi stacking.</p>
<fig id="F15" position="float">
<label>FIGURE 15</label>
<caption>
<p>Ligand-protein contacts between the compounds and TGR5 during simulation run <bold>(A)</bold> INT-777; <bold>(B)</bold> CNP0209363; <bold>(C)</bold> CNP0424850; <bold>(D)</bold> CNP0417335; <bold>(E)</bold> CNP0224616. The figure shows a schematic detail of the interactions that occur for more than 30% of the simulation time.</p>
</caption>
<graphic xlink:href="fchem-12-1503593-g015.tif"/>
</fig>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Overview of the interacting amino acid residues and bond types of the compounds and TGR5 during MDS.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Compound name</th>
<th align="center">Interacting amino acid residue</th>
<th align="left">Bond type</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">INT-777</td>
<td align="center">Trp 75<break/>Gln 253<break/>Leu 74<break/>Cys 155<break/>Tyr 89<break/>Ser 157<break/>Ser 247<break/>Tyr 240</td>
<td align="left">Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond</td>
</tr>
<tr>
<td align="center">CNP0209363</td>
<td align="center">Ser 157<break/>Ser 247<break/>Pro 259</td>
<td align="left">Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond</td>
</tr>
<tr>
<td align="center">CNP0424850</td>
<td align="center">Glu 169<break/>Ser 247<break/>Asn 93<break/>Ser 270<break/>Leu 266<break/>Phe 96</td>
<td align="left">Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>&#x3c0;-&#x3c0; stacking</td>
</tr>
<tr>
<td align="center">CNP0417335</td>
<td align="center">Ser 270<break/>Thr 243<break/>Asn 93<break/>Pro 259<break/>Ser 247<break/>Leu 71<break/>Ala 67<break/>Phe 96</td>
<td align="left">Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>&#x3c0;-&#x3c0; stacking</td>
</tr>
<tr>
<td align="center">CNP0224616</td>
<td align="center">Ser 247<break/>Leu 71<break/>Ser 157<break/>Tyr 89</td>
<td align="left">Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond<break/>Hydrogen bond</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussion</title>
<p>Type 2 diabetes is a leading cause of mortality (<xref ref-type="bibr" rid="B1">Abdul Basith Khan et al., 2020</xref>). Despite therapeutic advances in the management of this disease, the imbalance in glucose homeostasis and energy expenditure associated with its progression remains a challenge (<xref ref-type="bibr" rid="B29">Mirzadeh et al., 2022</xref>; <xref ref-type="bibr" rid="B42">Reed et al., 2021</xref>; <xref ref-type="bibr" rid="B12">B&#xfc;sing et al., 2019</xref>; <xref ref-type="bibr" rid="B52">Stein et al., 2013</xref>). In this study, predictive machine learning-based models, molecular docking, and molecular dynamics simulation were used to identify TGR5 agonists for the management of type 2 diabetes.</p>
<p>Compounds with their corresponding EC<sub>50</sub> values exhibiting biological activity towards TGR5 were downloaded from the ChEMBL database. Considering the biological activity of the compounds, they were characterised as either active or inactive. The ML evaluation of TGR5 agonists showed that the molecular weight (MW), number of hydrogen bond donors (nHDonors), and number of hydrogen bond acceptors (nHAcceptors) were the significant descriptors between active and inactive compounds (<xref ref-type="bibr" rid="B44">Sasaki et al., 2023</xref>). This observation can be further compared with drug-likeness principles such as the Lipinski&#x2019;s Rule of Five, where smaller MW and ideal hydrogen bonding are efficient for pharmacokinetics and biopharmaceutical availability (<xref ref-type="bibr" rid="B11">Brueckner et al., 2024</xref>). Nevertheless, some bioactive natural compounds have higher molecular weight (<xref ref-type="bibr" rid="B22">Feher and Schmidt, 2003</xref>; <xref ref-type="bibr" rid="B16">Clardy and Walsh, 2004</xref>). Besides meeting the Ro5 criteria, natural products with high molecular masses have penetrated the pharmaceutical markets as approved oral drugs (<xref ref-type="bibr" rid="B49">Shultz, 2018</xref>; <xref ref-type="bibr" rid="B39">Price et al., 2024</xref>).</p>
<p>Active site residues of the crystal structure of TGR5 in complex with its co-crystallised ligand, INT-777, are Leu74, Tyr89, Phe161, Leu166, Tyr240, Thr243, Leu244, Ser247, Tyr251, Leu262, Leu263, Leu266, and Ser270 as reported by <xref ref-type="bibr" rid="B56">Yang et al. (2020)</xref>. The docking results show that all the compounds were positioned within the active site of TGR5. They also showed that hydrogen bonding and hydrophobic interactions are important in TGR5 receptor and agonist binding. Particularly, residues such as Tyr240 and Asp348 were predicted to be critical in stabilising the ligand-receptor complex, supporting previous findings on TGR5 activation (<xref ref-type="bibr" rid="B24">Guo et al., 2016</xref>). Nevertheless, the flexibility of the binding site remains a major problem for predicting binding affinities, and to overcome that problem, dynamic studies are required in order to capture the conformational changes of the receptor upon ligand binding (<xref ref-type="bibr" rid="B30">Mursal et al., 2024</xref>).</p>
<p>Molecular dynamics simulations further validated the stability of these interactions, showing that the identified lead compounds formed stable complexes with TGR5 throughout the simulation period. RMSD and RMSF are critical indicators of structural stability and flexibility for a simulation (<xref ref-type="bibr" rid="B3">Ahmad et al., 2020</xref>). According to <xref ref-type="bibr" rid="B50">Sindhu and Srinivasan (2015)</xref>, smaller RMSD values for backbone atoms suggest that the predicted structural models closely match experimental data, indicating higher model accuracy. In contrast, larger RMSD values point to greater deviations and reduced accuracy. This is important in an effort to document the idea that potential drugs do not relinquish their efficiency when exposed to tangible physiology (<xref ref-type="bibr" rid="B11">Brueckner et al., 2024</xref>). Simulation studies show compound stability within the TGR5 binding pocket, especially for CNP0417335 and CNP0224616; however, <italic>in vivo</italic> and/or <italic>in vitro</italic> experimental validation is necessary to determine the pharmacokinetic and toxicity profiles of these compounds in biological systems. Intramolecular hydrogen bonds may have stabilised the bioactive conformation of the ligands, which might have led to the stronger association observed between the lead compounds and TGR5. These bonds could have acted by lowering the translational and conformational entropy during binding (<xref ref-type="bibr" rid="B17">Davoren et al., 2016</xref>), resulting in lower binding energies. Water bridges are also an excellent way to manage protein-ligand complexes; these bridges exist where one or more water molecules are present between the protein and the ligand. Water bridges could have facilitated the formation of a water tunnel in TGR5 during the simulation, as mentioned by <xref ref-type="bibr" rid="B36">Olaposi et al. (2019)</xref>, leading to the stability of the complexes.</p>
<p>The development of effective TGR5 agonists has been hampered due to gastrointestinal side effects (<xref ref-type="bibr" rid="B58">Zhuo et al., 2024</xref>). For instance, INT-777 was found to activate TGR5; however, when tested in the first phases, it was discovered that it poses negative effects on the gastrointestinal tract (<xref ref-type="bibr" rid="B24">Guo et al., 2016</xref>). For this reason, there is a need to find selective agonists that do not possess such undesired activity.</p>
<p>Machine learning has enhanced drug discovery and development by increasing efficiency and prediction accuracy. Incorporating big chemical data together with artificial neural network algorithms has enhanced the speed and accuracy of the predictions compared to conventional methods (<xref ref-type="bibr" rid="B54">van Heerden et al., 2023</xref>). However, as pointed out in this analysis, existing ML models are vastly dependent on the quality and size of data used in their development, and this has reduced the generality of models in practice. Molecular docking using TGR5 as a subject can also be enhanced with the help of special structural techniques such as cryo-electron microscopy or X-ray crystallography to gain more information regarding the active conformation of the receptor. The integration of these experimental methodologies with MD simulations may improve the reliability of the binding energy predictions and would be beneficial for the design of more selective TGR5 agonists (<xref ref-type="bibr" rid="B11">Brueckner et al., 2024</xref>).</p>
</sec>
<sec sec-type="conclusion" id="s5">
<title>5 Conclusion</title>
<p>According to this study, new TGR5 agonists for T2D could be developed via machine learning (ML), molecular docking (MD) and molecular dynamics simulation (MDS) techniques. Although the computational methods studied here illuminate new directions in the search for TGR5 agonists, the actual effectiveness of these approaches remains contingent on the experimental testing of predicted compounds. The integration of these techniques will provide a framework for designing novel TGR5 agonists, and improve the accuracy of identification of lead compounds for T2D treatment.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The dataset analyzed during the current study as a case study is publicly available at <ext-link ext-link-type="uri" xlink:href="https://github.com/omicscodeathon/tgr5t2d/tree/main/data">https://github.com/omicscodeathon/tgr5t2d/tree/main/data</ext-link>. The data supporting the results reported in this manuscript is included within the article and its additional files. The generated progress reports are in HTML format and can be viewed using any preferred browser such as Chrome, Safari, Internet Explorer and Firefox. The project repository, which also includes the entire code and other requirements, can be downloaded from <ext-link ext-link-type="uri" xlink:href="https://github.com/omicscodeathon/tgr5t2d">https://github.com/omicscodeathon/tgr5t2d</ext-link>. The guidelines for implementing this tool and related updates are available at: <ext-link ext-link-type="uri" xlink:href="https://github.com/omicscodeathon/tgr5t2d/blob/main/README.md">https://github.com/omicscodeathon/tgr5t2d/blob/main/README.md</ext-link>.</p>
</sec>
<sec sec-type="author-contributions" id="s7">
<title>Author contributions</title>
<p>OE: Conceptualization, Data curation, Formal Analysis, Investigation, Methodology, Project administration, Resources, Validation, Visualization, Writing&#x2013;original draft, Writing&#x2013;review and editing. CO: Writing&#x2013;original draft, Writing&#x2013;review and editing, Investigation, Project administration. HN: Data curation, Methodology, Resources, Writing&#x2013;original draft, Writing&#x2013;review and editing. OK: Writing&#x2013;review and editing, Writing&#x2013;original draft. AM: Writing&#x2013;review and editing, Data curation, Formal Analysis, Software. FM: Writing&#x2013;review and editing. AY: Writing&#x2013;review and editing. OA: Project administration, Supervision, Writing&#x2013;review and editing, Resources.</p>
</sec>
<sec sec-type="funding-information" id="s8">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research, authorship, and/or publication of this article.</p>
</sec>
<ack>
<p>The authors thank the National Institutes of Health (NIH) Office of Data Science Strategy (ODSS) for their immense support before and during the October 2024 Omics codeathon organized by the African Society for Bioinformatics and Computational Biology (ASBCB).</p>
</ack>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s10">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abdul Basith Khan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hashim</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>J. K.</given-names>
</name>
<name>
<surname>Govender</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Mustafa</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Al Kaabi</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Epidemiology of type 2 diabetes&#x2014;global burden of disease and forecasted trends</article-title>. <source>J. Epidemiol. Glob. Health</source> <volume>10</volume> (<issue>1</issue>), <fpage>107</fpage>&#x2013;<lpage>111</lpage>. <pub-id pub-id-type="doi">10.2991/jegh.k.191028.001</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abolo</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ssenkaali</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mulumba</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Awe</surname>
<given-names>O. I.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Exploring the causal effect of omega-3 polyunsaturated fatty acid levels on the risk of type 1 diabetes: a Mendelian randomization study</article-title>. <source>Front. Genet.</source> <volume>15</volume>, <fpage>1353081</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2024.1353081</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahmad</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Sinha</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ahmad</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Khalid</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Study of caspase 8 inhibition for the management of Alzheimer&#x2019;s disease: a molecular docking and dynamics simulation</article-title>. <source>Molecules</source> <volume>25</volume> (<issue>9</issue>), <fpage>2071</fpage>. <pub-id pub-id-type="doi">10.3390/molecules25092071</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alaya</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Baraket</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Adediran</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Cuttler</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Ajiboye</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Kivumbi</surname>
<given-names>M. T.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Multiple sclerosis stages and their differentially expressed genes: a bioinformatics analysis</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2024.01.20.576448</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Awe</surname>
<given-names>O. I.</given-names>
</name>
<name>
<surname>En Najih</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Nyamari</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Mukanga</surname>
<given-names>L. B.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Comparative study between molecular and genetic evolutionary analysis tools using African SARS-CoV2 variants</article-title>. <source>Inf. Med. Unlocked</source> <volume>36</volume>, <fpage>101143</fpage>. <pub-id pub-id-type="doi">10.1016/j.imu.2022.101143</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ben Aribi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Abassi</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Awe</surname>
<given-names>O. I.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>NeuroVar: an open-source tool for gene expression and variation data visualization for biomarkers of neurological diseases</article-title>. <source>Gigabyte</source>. <pub-id pub-id-type="doi">10.46471/gigabyte.143</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bento</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Gaulton</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hersey</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bellis</surname>
<given-names>L. J.</given-names>
</name>
<name>
<surname>Chambers</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Davies</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>The ChEMBL bioactivity database: an update</article-title>. <source>Nucleic Acids Res.</source> <volume>42</volume> (<issue>D1</issue>), <fpage>D1083</fpage>&#x2013;<lpage>D1090</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkt1031</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhatti</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Sehrawat</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mishra</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sidhu</surname>
<given-names>I. S.</given-names>
</name>
<name>
<surname>Navik</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Khullar</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Oxidative stress in the pathophysiology of type 2 diabetes and related complications: current therapeutics strategies and future perspectives</article-title>. <source>Free Radic. Biol. Med.</source> <volume>184</volume>, <fpage>114</fpage>&#x2013;<lpage>134</lpage>. <pub-id pub-id-type="doi">10.1016/j.freeradbiomed.2022.03.019</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhimanwar</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Lokhande</surname>
<given-names>K. B.</given-names>
</name>
<name>
<surname>Shrivastava</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Chitlange</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Mittal</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Identification of potential drug candidates as TGR5 agonist to combat type II diabetes using <italic>in silico</italic> docking and molecular dynamics simulation studies</article-title>. <source>J. Biomol. Struct. Dyn.</source> <volume>41</volume> (<issue>22</issue>), <fpage>13314</fpage>&#x2013;<lpage>13331</lpage>. <pub-id pub-id-type="doi">10.1080/07391102.2023.2173654</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhimanwar</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Mittal</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>TGR5 agonists for diabetes treatment: a patent review and clinical advancements (2012-present)</article-title>. <source>Expert Opin. Ther. Pat.</source> <volume>32</volume> (<issue>2</issue>), <fpage>191</fpage>&#x2013;<lpage>209</lpage>. <pub-id pub-id-type="doi">10.1080/13543776.2022.1994551</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brueckner</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Shields</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Kirubakaran</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Suponya</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Panda</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Posy</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>MDFit: automated molecular simulations workflow enables high throughput assessment of ligands-protein dynamics</article-title>. <source>J. Comput. Aided Mol. Des.</source> <volume>38</volume>, <fpage>24</fpage>. <pub-id pub-id-type="doi">10.1007/s10822-024-00564-2</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>B&#xfc;sing</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>H&#xe4;gele</surname>
<given-names>F. A.</given-names>
</name>
<name>
<surname>Nas</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hasler</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>M&#xfc;ller</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Bosy-Westphal</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Impact of energy turnover on the regulation of glucose homeostasis in healthy subjects</article-title>. <source>Nutr. Diabetes</source> <volume>9</volume>, <fpage>22</fpage>. <pub-id pub-id-type="doi">10.1038/s41387-019-0089-6</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Capecchi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Reymond</surname>
<given-names>J. L.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Classifying natural products from plants, fungi or bacteria using the COCONUT database and machine learning</article-title>. <source>J. Cheminform.</source> <volume>13</volume>, <fpage>82</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-021-00559-3</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chatterjee</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Khunti</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Davies</surname>
<given-names>M. J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Type 2 diabetes</article-title>. <source>Lancet</source> <volume>389</volume> (<issue>10085</issue>), <fpage>2239</fpage>&#x2013;<lpage>2251</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(17)30058-2</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chikwambi</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Hidjo</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chikondowa</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Afolabi</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Aketch</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Jayeoba</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Multi-omics data integration approach identifies potential biomarkers for Prostate cancer</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2023.01.26.522643</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Clardy</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Walsh</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Lessons from natural molecules</article-title>. <source>Nature</source> <volume>432</volume>, <fpage>829</fpage>&#x2013;<lpage>837</lpage>. <pub-id pub-id-type="doi">10.1038/nature03194</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davoren</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>O&#x2019;Neil</surname>
<given-names>S. V.</given-names>
</name>
<name>
<surname>Anderson</surname>
<given-names>D. P.</given-names>
</name>
<name>
<surname>Brodney</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Chenard</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Dlugolenski</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Design and optimization of selective azaindole amide M1 positive allosteric modulators</article-title>. <source>Bioorg. Med. Chem. Lett.</source> <volume>26</volume> (<issue>2</issue>), <fpage>650</fpage>&#x2013;<lpage>655</lpage>. <pub-id pub-id-type="doi">10.1016/j.bmcl.2015.11.053</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DeFronzo</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Ferrannini</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Groop</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Henry</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Herman</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Holst</surname>
<given-names>J. J.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Type 2 diabetes mellitus</article-title>. <source>Nat. Rev. Dis. Prim.</source> <volume>1</volume>, <fpage>15019</fpage>. <pub-id pub-id-type="doi">10.1038/nrdp.2015.19</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Deol</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bashir</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Exploring the complications of type 2 diabetes mellitus: pathophysiology and management strategies</article-title>. <source>EPRA Int. J. Res. Dev. (IJRD)</source> <volume>9</volume> (<issue>7</issue>), <fpage>173</fpage>&#x2013;<lpage>182</lpage>. <pub-id pub-id-type="doi">10.36713/epra17838</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Di Stefano</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Galati</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ortore</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Caligiuri</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Rizzolio</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ceni</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Machine learning-based virtual screening for the identification of CDK5 inhibitors</article-title>. <source>Int. J. Mol. Sci.</source> <volume>23</volume> (<issue>18</issue>), <fpage>10653</fpage>. <pub-id pub-id-type="doi">10.3390/ijms231810653</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>El Abed</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Baraket</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Nyamari</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Naitore</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Awe</surname>
<given-names>O. I.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Differential expression analysis of miRNAs and mRNAs in epilepsy uncovers potential biomarkers</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2023.09.11.557132</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feher</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>J. M.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Property distributions: differences between drugs, natural products, and molecules from combinatorial chemistry</article-title>. <source>J. Chem. Inf. Comput. Sci.</source> <volume>43</volume> (<issue>1</issue>), <fpage>218</fpage>&#x2013;<lpage>227</lpage>. <pub-id pub-id-type="doi">10.1021/ci0200467</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gaulton</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hersey</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nowotka</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bento</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Chambers</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mendez</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>The ChEMBL database in 2017</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume> (<issue>D1</issue>), <fpage>D945</fpage>&#x2013;<lpage>D954</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw1074</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W. D.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y. D.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>TGR5, not only a metabolic regulator</article-title>. <source>Front. Physiol.</source> <volume>7</volume>, <fpage>646</fpage>. <pub-id pub-id-type="doi">10.3389/fphys.2016.00646</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ikwuka</surname>
<given-names>A. O.</given-names>
</name>
<name>
<surname>Omoju</surname>
<given-names>D. I.</given-names>
</name>
<name>
<surname>Mahanera</surname>
<given-names>O. K.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Profiling of clinical dynamics of type 2 diabetes mellitus in patients: a perspective review</article-title>. <source>World J. Curr. Med. Pharm. Res.</source> <volume>5</volume> (<issue>5</issue>), <fpage>210</fpage>&#x2013;<lpage>218</lpage>. <pub-id pub-id-type="doi">10.37022/wjcmpr.v5i5.294</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lipinski</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Lombardo</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Dominy</surname>
<given-names>B. W.</given-names>
</name>
<name>
<surname>Feeney</surname>
<given-names>P. J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Experimental and computational approaches to estimate solubility and permeability in drug discovery and development settings</article-title>. <source>Adv. Drug Deliv. Rev.</source> <volume>64</volume>, <fpage>4</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1016/j.addr.2012.09.019</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lun</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bai</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Mechanism of action of the bile acid receptor TGR5 in obesity</article-title>. <source>Acta Pharm. Sin. B</source> <volume>14</volume> (<issue>2</issue>), <fpage>468</fpage>&#x2013;<lpage>491</lpage>. <pub-id pub-id-type="doi">10.1016/j.apsb.2023.11.011</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mansour</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mousa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Abdelmannan</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Tay</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Hassoun</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Alsafar</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Microvascular and macrovascular complications of type 2 diabetes mellitus: exome wide association analyses</article-title>. <source>Front. Endocrinol.</source> <volume>14</volume>, <fpage>1143067</fpage>. <pub-id pub-id-type="doi">10.3389/fendo.2023.1143067</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mirzadeh</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Faber</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Schwartz</surname>
<given-names>M. W.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Central nervous system control of glucose homeostasis: a therapeutic target for type 2 diabetes?</article-title> <source>Annu. Rev. Pharmacol. Toxicol.</source> <volume>62</volume>, <fpage>55</fpage>&#x2013;<lpage>84</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-pharmtox-052220-010446</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mursal</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ahmad</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hussain</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Khan</surname>
<given-names>M. F.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Navigating the computational seas: a comprehensive overview of molecular docking software in drug discovery</article-title>. <source>IntechOpen</source>. <pub-id pub-id-type="doi">10.5772/intechopen.1004802</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mwanga</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Obura</surname>
<given-names>H. O.</given-names>
</name>
<name>
<surname>Evans</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Awe</surname>
<given-names>O. I.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Enhanced deep convolutional neural network for SARS-CoV-2 variants classification</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2023.08.09.552643</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nyamari</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Omar</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Fayehun</surname>
<given-names>A. F.</given-names>
</name>
<name>
<surname>Dachi</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Bwana</surname>
<given-names>B. K.</given-names>
</name>
<name>
<surname>Awe</surname>
<given-names>O. I.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Expression level analysis of ACE2 receptor gene in African-American and non-African-American COVID-19 patients</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2023.09.11.557129</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nzungize</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Kengne-Ouafo</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Wesonga</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Umuhoza</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Murithi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Kimani</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Transcriptional profiles analysis of COVID-19 and malaria patients reveals potential biomarkers in children</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2022.06.30.498338</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Obura</surname>
<given-names>H. O.</given-names>
</name>
<name>
<surname>Mlay</surname>
<given-names>C. D.</given-names>
</name>
<name>
<surname>Moyo</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Karumbo</surname>
<given-names>B. M.</given-names>
</name>
<name>
<surname>Omar</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Sinza</surname>
<given-names>E. M.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Molecular phylogenetics of HIV-1 subtypes in African populations: a case study of sub-Saharan African countries</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2022.05.18.492401</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ogbodo</surname>
<given-names>U. C.</given-names>
</name>
<name>
<surname>Enejoh</surname>
<given-names>O. A.</given-names>
</name>
<name>
<surname>Okonkwo</surname>
<given-names>C. H.</given-names>
</name>
<name>
<surname>Gnanasekar</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Gachanja</surname>
<given-names>P. W.</given-names>
</name>
<name>
<surname>Osata</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Computational identification of potential inhibitors targeting cdk1 in colorectal cancer</article-title>. <source>Front. Chem.</source> <volume>11</volume>, <fpage>1264808</fpage>. <pub-id pub-id-type="doi">10.3389/fchem.2023.1264808</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Olaposi</surname>
<given-names>O. I.</given-names>
</name>
<name>
<surname>Oyekanmi</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Samuel</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Enejoh</surname>
<given-names>O. A.</given-names>
</name>
<name>
<surname>Victor</surname>
<given-names>U. O.</given-names>
</name>
<name>
<surname>Niyi</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Takeda G-protein receptor (TGR)-5 evolves classical active-state conformational signatures in complex with Chromolaena odorata-derived flavonoid-5, 7-dihydroxy-6-4-dimethoxyflavanone</article-title>. <source>Curr. Chem. Biol.</source> <volume>13</volume> (<issue>3</issue>), <fpage>212</fpage>&#x2013;<lpage>222</lpage>. <pub-id pub-id-type="doi">10.2174/2212796813666190102102018</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oluwagbemi</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Awe</surname>
<given-names>O. I.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>A comparative computational genomics of Ebola Virus Disease strains: in-silico Insight for Ebola control</article-title>. <source>Inf. Med. Unlocked</source> <volume>12</volume>, <fpage>106</fpage>&#x2013;<lpage>119</lpage>. <pub-id pub-id-type="doi">10.1016/j.imu.2018.07.004</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ong</surname>
<given-names>K. L.</given-names>
</name>
<name>
<surname>Stafford</surname>
<given-names>L. K.</given-names>
</name>
<name>
<surname>McLaughlin</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Boyko</surname>
<given-names>E. J.</given-names>
</name>
<name>
<surname>Vollset</surname>
<given-names>S. E.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>A. E.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Global, regional, and national burden of diabetes from 1990 to 2021, with projections of prevalence to 2050: a systematic analysis for the Global Burden of Disease Study 2021</article-title>. <source>Lancet</source> <volume>402</volume> (<issue>10397</issue>), <fpage>203</fpage>&#x2013;<lpage>234</lpage>. <pub-id pub-id-type="doi">10.1016/s0140-6736(23)01301-6</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Price</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Weinheimer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Rivkin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Jenkins</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Nijsen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cox</surname>
<given-names>P. B.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Beyond rule of five and PROTACs in modern drug discovery: polarity reducers, chameleonicity, and the evolving physicochemical landscape</article-title>. <source>J. Med. Chem.</source> <volume>67</volume> (<issue>7</issue>), <fpage>5683</fpage>&#x2013;<lpage>5698</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jmedchem.3c02332</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Puzyn</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Mostrag-Szlichtyng</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gajewicz</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Skrzy&#x144;ski</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Worth</surname>
<given-names>A. P.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Investigating the influence of data splitting on the predictive ability of QSAR/QSPR models</article-title>. <source>Struct. Chem.</source> <volume>22</volume> (<issue>4</issue>), <fpage>795</fpage>&#x2013;<lpage>804</lpage>. <pub-id pub-id-type="doi">10.1007/s11224-011-9757-4</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qin</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Lei</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Machine learning-and structure-based discovery of a novel chemotype as FXR agonists for potential treatment of nonalcoholic fatty liver disease</article-title>. <source>Eur. J. Med. Chem.</source> <volume>252</volume>, <fpage>115307</fpage>. <pub-id pub-id-type="doi">10.1016/j.ejmech.2023.115307</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reed</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bain</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kanamarlapudi</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A review of current trends with type 2 diabetes epidemiology, aetiology, pathogenesis, treatments and future perspectives</article-title>. <source>Diabetes Metab. Syndr. Obes.</source> <volume>14</volume>, <fpage>3567</fpage>&#x2013;<lpage>3602</lpage>. <pub-id pub-id-type="doi">10.2147/DMSO.S319895</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sadybekov</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Katritch</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Computational approaches streamlining drug discovery</article-title>. <source>Nature</source> <volume>616</volume>, <fpage>673</fpage>&#x2013;<lpage>685</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-023-05905-z</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sasaki</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ikari</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Hashimoto</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sato</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Identification of &#x3b1;-ionone, nootkatone, and their derivatives as TGR5 agonists</article-title>. <source>Biochem. Biophys. Res. Commun.</source> <volume>653</volume>, <fpage>147</fpage>&#x2013;<lpage>152</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbrc.2023.02.070</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sato</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Genet</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Strehle</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Thomas</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Lobstein</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wagner</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2007</year>). <article-title>Anti-hyperglycemic activity of a TGR5 agonist isolated from <italic>Olea europaea</italic></article-title>. <source>Biochem. Biophys. Res. Commun.</source> <volume>362</volume> (<issue>4</issue>), <fpage>793</fpage>&#x2013;<lpage>798</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbrc.2007.06.130</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="book">
<collab>Schr&#xf6;dinger</collab> (<year>2021</year>). <source>Maestro version 12.8.117 release 2021-2: Glide</source>. <publisher-loc>New York, NY, USA</publisher-loc>: <publisher-name>Schr&#xf6;dinger LLC</publisher-name>.</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sharma</surname>
<given-names>U. K.</given-names>
</name>
<name>
<surname>Pujani</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Anuradha</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Type-II-diabetes mellitus: etiology, epidemiology, risk factors and diagnosis and insight into demography (urban versus rural)</article-title>. <source>Int. J. Health Sci. Res.</source> <volume>14</volume> (<issue>1</issue>), <fpage>283</fpage>&#x2013;<lpage>290</lpage>. <pub-id pub-id-type="doi">10.52403/ijhsr.20240136</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shivanika</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Ragunathan</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Tiwari</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sumitha</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>P</surname>
<given-names>B. D.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Molecular docking, validation, dynamics simulations, and pharmacokinetic prediction of natural compounds against the SARS-CoV-2 main-protease</article-title>. <source>J. Biomol. Struct. Dyn.</source> <volume>1</volume>, <fpage>1</fpage>&#x2013;<lpage>27</lpage>. <pub-id pub-id-type="doi">10.1080/07391102.2020.1815584</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shultz</surname>
<given-names>M. D.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Two decades under the influence of the rule of five and the changing properties of approved oral drugs: miniperspective</article-title>. <source>J. Med. Chem.</source> <volume>62</volume> (<issue>4</issue>), <fpage>1701</fpage>&#x2013;<lpage>1714</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jmedchem.8b00686</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sindhu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Srinivasan</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Exploring the binding properties of agonists interacting with human TGR5 using structural modeling, molecular docking and dynamics simulations</article-title>. <source>RSC Adv.</source> <volume>5</volume> (<issue>19</issue>), <fpage>14202</fpage>&#x2013;<lpage>14213</lpage>. <pub-id pub-id-type="doi">10.1039/C4RA16617E</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sorokina</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Merseburger</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Rajan</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Yirik</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Steinbeck</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>COCONUT online: collection of open natural products database</article-title>. <source>J. Cheminformatics</source> <volume>13</volume> (<issue>1</issue>), <fpage>2</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-020-00478-9</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stein</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Lamos</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>S. N.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>A review of the efficacy and safety of oral antidiabetic drugs</article-title>. <source>Expert Opin. Drug Saf.</source> <volume>12</volume> (<issue>2</issue>), <fpage>153</fpage>&#x2013;<lpage>175</lpage>. <pub-id pub-id-type="doi">10.1517/14740338.2013.752813</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thomas</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Pellicciari</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Pruzanski</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Auwerx</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Schoonjans</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Targeting bile-acid signalling for metabolic diseases</article-title>. <source>Nat. Rev. Drug Discov.</source> <volume>7</volume> (<issue>8</issue>), <fpage>678</fpage>&#x2013;<lpage>693</lpage>. <pub-id pub-id-type="doi">10.1038/nrd2619</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>van Heerden</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Tur&#xf3;n</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Duran-Frigola</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pillay</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Birkholtz</surname>
<given-names>L.-M.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Machine learning approaches identify chemical features for stage-specific antimalarial compounds</article-title>. <source>ACS Omega</source> <volume>8</volume>, <fpage>43813</fpage>&#x2013;<lpage>43826</lpage>. <pub-id pub-id-type="doi">10.1021/acsomega.3c05664</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wesonga</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Awe</surname>
<given-names>O. I.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>An assessment of traditional and genomic screening in newborns and their applicability for Africa</article-title>. <source>Inf. Med. Unlocked</source> <volume>32</volume>, <fpage>101050</fpage>. <pub-id pub-id-type="doi">10.1016/j.imu.2022.101050</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Mao</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ming</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Structural basis of GPBAR activation and bile acid recognition</article-title>. <source>Nature</source> <volume>587</volume> (<issue>7834</issue>), <fpage>499</fpage>&#x2013;<lpage>504</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-020-2569-1</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yap</surname>
<given-names>C. W.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>PaDEL-descriptor: an open source software to calculate molecular descriptors and fingerprints</article-title>. <source>J. Comput. Chem.</source> <volume>32</volume> (<issue>7</issue>), <fpage>1466</fpage>&#x2013;<lpage>1474</lpage>. <pub-id pub-id-type="doi">10.1002/jcc.21707</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhuo</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Yun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Discovery of betulinic acid derivatives as gut-restricted TGR5 agonists: balancing the potency and physicochemical properties</article-title>. <source>Bioorg. Chem.</source> <volume>144</volume>, <fpage>107132</fpage>. <pub-id pub-id-type="doi">10.1016/j.bioorg.2024.107132</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>