<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="review-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Chem.</journal-id>
<journal-title>Frontiers in Chemistry</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Chem.</abbrev-journal-title>
<issn pub-type="epub">2296-2646</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1632046</article-id>
<article-id pub-id-type="doi">10.3389/fchem.2025.1632046</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Chemistry</subject>
<subj-group>
<subject>Review</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Recent advances in AI-based toxicity prediction for drug discovery</article-title>
<alt-title alt-title-type="left-running-head">Lee et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fchem.2025.1632046">10.3389/fchem.2025.1632046</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Lee</surname>
<given-names>Hyundo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Kim</surname>
<given-names>Jisan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Kim</surname>
<given-names>Ji-Woon</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3095501/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Lee</surname>
<given-names>Yoonji</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1084715/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Global Innovative Drugs</institution>, <institution>Chung-Ang University</institution>, <addr-line>Seoul</addr-line>, <country>Republic of Korea</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>College of Pharmacy</institution>, <institution>Kyung Hee University</institution>, <addr-line>Seoul</addr-line>, <country>Republic of Korea</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>College of Pharmacy</institution>, <institution>Chung-Ang University</institution>, <addr-line>Seoul</addr-line>, <country>Republic of Korea</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2576939/overview">Xin Wang</ext-link>, Shenzhen Technology University, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/344057/overview">Georgios Papamokos</ext-link>, University of Ioannina, Greece</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3081809/overview">Ashwin Dhakal</ext-link>, The University of Missouri, United States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Ji-Woon Kim, <email>jiwoonkim@khu.ac.kr</email>; Yoonji Lee, <email>yoonjilee@cau.ac.kr</email>
</corresp>
<fn fn-type="equal" id="fn001">
<label>
<sup>&#x2020;</sup>
</label>
<p>These authors have contributed equally to this work</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>08</day>
<month>07</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1632046</elocation-id>
<history>
<date date-type="received">
<day>20</day>
<month>05</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>18</day>
<month>06</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Lee, Kim, Kim and Lee.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Lee, Kim, Kim and Lee</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Toxicity, defined as the potential harm a substance can cause to living organisms, requires the implementation of stringent regulatory standards to ensure public safety. These standards involve comprehensive testing frameworks, including hazard identification, dose-response evaluation, exposure assessment, and risk characterization. In drug discovery and development, these processes are often complex, time-consuming, and also resource-intensive. Toxicity-related failures in the later stages of drug development can lead to substantial financial losses, underscoring the need for reliable toxicity prediction during the early discovery phases. The advent of computational approaches has accelerated a shift toward <italic>in silico</italic> modeling, virtual screening, and, notably, artificial intelligence (AI) to identify potential toxicities earlier in the pipeline. Ongoing advances in databases, algorithms, and computational power have further expanded AI&#x2019;s role in pharmaceutical research. Today, AI models are capable of predicting wide range of toxicity endpoints, such as hepatotoxicity, cardiotoxicity, nephrotoxicity, neurotoxicity, and genotoxicity, based on diverse molecular representations ranging from traditional descriptors to graph-based methods. This review provides an in-depth examination of AI-driven toxicity prediction, emphasizing its transformative impact on drug discovery and its growing importance in improving safety assessments.</p>
</abstract>
<kwd-group>
<kwd>artificial intelligence</kwd>
<kwd>drug discovery</kwd>
<kwd>toxicity</kwd>
<kwd>in silico methods</kwd>
<kwd>virtual screening</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Theoretical and Computational Chemistry</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Toxicity refers to the extent to which a substance can cause harm to living organisms, including animals, plants, bacteria, and humans (<xref ref-type="bibr" rid="B28">Duffus, 1993</xref>; <xref ref-type="bibr" rid="B80">McNaught and Wilkinson, 2025</xref>). While many chemicals enhance our quality of life, they can also pose significant toxic risks. To ensure public safety, various regulatory frameworks have been established to mitigate these hazards. Given the potential health risks associated with chemical exposure, thorough evaluation of such substances in the environment is essential. Regulatory standards typically mandate toxicity testing, encompassing hazard identification, dose-response assessment, exposure evaluation, and risk characterization (<xref ref-type="bibr" rid="B59">Krewski et al., 2010</xref>). As part of hazard identification, it is necessary to determine the specific toxicity endpoints associated with each chemical. In parallel, <italic>in vitro</italic> and <italic>in vivo</italic> studies aim to elucidate the conditions under which these toxic effects may occur in humans, often drawing on epidemiological insights. Dose-response assessments examine the relationship between chemical exposure and adverse effects, using benchmarks such as the no-observed-adverse-effect level (NOAEL), lowest-observed-adverse-effect level (LOAEL), and potential carcinogenicity (<xref ref-type="bibr" rid="B86">NRC, 1994</xref>). While this approach focuses on the magnitude of exposure required to produce harmful effects, the adverse outcome pathway (AOP) framework provides a complementary mechanistic perspective (<xref ref-type="bibr" rid="B5">Ankley et al., 2010</xref>). AOPs begin with a molecular initiating event, such as a chemical binding to a receptor, and proceed through a series of causally connected key events (KEs) until an adverse outcome (AO) is reached at the organism level (<xref ref-type="bibr" rid="B112">Villeneuve et al., 2014</xref>). By linking mechanistic insights with experimental data, AOPs exemplify how diverse information sources can be integrated to better understand chemical toxicity (<xref ref-type="bibr" rid="B112">Villeneuve et al., 2014</xref>). This growing emphasis on data integration has also driven the development of AI-based models with both experimental and computational inputs to support early-stage toxicity prediction.</p>
<p>The advent of computational approaches, combined with the growing availability of experimental data, has paved the way for more cost-effective, time-efficient strategies in early-stage drug discovery (<xref ref-type="bibr" rid="B76">Mak and Pichika, 2019</xref>; <xref ref-type="bibr" rid="B110">Vamathevan et al., 2019</xref>). By incorporating AI-based toxicity prediction models into virtual screening pipelines, compounds likely to exhibit toxicity can be filtered out before <italic>in vitro</italic> assays. This strategy increases the success rate of candidates advancing through toxicity evaluations, thereby enhancing the overall efficiency of drug development (<xref ref-type="fig" rid="F1">Figure 1A</xref>). AI models can be trained on large-scale public databases such as ChEMBL (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>), DrugBank (<xref ref-type="bibr" rid="B120">Wishart et al., 2018</xref>), and BindingDB (<xref ref-type="bibr" rid="B73">Liu et al., 2007</xref>), which contain <italic>in vitro</italic> and <italic>in vivo</italic> experimental results. In addition to open-source datasets, proprietary data generated from <italic>in vitro</italic> assays, <italic>in vivo</italic> studies, clinical trials, and post-marketing surveillance can further enrich these models (<xref ref-type="bibr" rid="B91">Pognan et al., 2023</xref>). Integrating AI-based toxicity prediction into virtual screening and then feeding back the experimental outcomes from downstream studies (<italic>in vitro</italic>, <italic>in vivo</italic>, and clinical), creates a virtuous cycle. This feedback process includes prospective and external validations, which evaluate model performance using newly generated or independent datasets and are essential for demonstrating generalizability and robustness in regulatory submissions. This continuous feedback loop improves model performance over time and supports more informed decision-making in early toxicity assessment (<xref ref-type="bibr" rid="B91">Pognan et al., 2023</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Overview of the AI-based toxicity prediction pipeline. <bold>(A)</bold> Integration of AI-based toxicity prediction into the drug development process. <bold>(B)</bold> Workflow of model development, including data collection, preprocessing, algorithm selection, and performance evaluation.</p>
</caption>
<graphic xlink:href="fchem-13-1632046-g001.tif">
<alt-text content-type="machine-generated">Diagram showing the process of AI-based toxicity prediction in drug development, divided into sections A and B. Section A outlines the stages: discovery, preclinical, and clinical research, featuring data feedback and process flow. It highlights in vitro toxicity assays and in vivo studies, leading to human clinical trials. Section B describes building AI models, detailing steps like data collection from sources like DrugBank and PubChem, data preprocessing, and modeling methods including machine learning and deep learning. It also covers evaluation metrics like accuracy and regression scores.</alt-text>
</graphic>
</fig>
<p>To develop such models, a systematic workflow is essential, typically consisting of four key stages: data collection, data preprocessing, model development, and evaluation (<xref ref-type="fig" rid="F1">Figure 1B</xref>). The first step involves gathering drug toxicity data from a variety of sources. These data sources, including both public databases and proprietary collections, provide extensive information on chemical structures, bioactivity, and associated toxicity profiles, forming a rich foundation for supervised learning (<xref ref-type="bibr" rid="B91">Pognan et al., 2023</xref>). Once the data is collected, preprocessing is carried out to transform raw experimental results into formats suitable for machine learning. This includes handling missing values, standardizing molecular representations (e.g., SMILES strings or molecular graphs), and performing feature engineering such as calculating molecular descriptors (e.g., molecular weight, clogP, number of rotatable bonds) (<xref ref-type="bibr" rid="B119">Wigh et al., 2022</xref>). Toxicity labels are also encoded appropriately. These steps ensure data consistency and help extract informative features for training predictive models. The next stage involves selecting and training appropriate modeling techniques. Depending on the data structure and task complexity, a variety of algorithms can be applied, including Random Forest, XGBoost, Support Vector Machines (SVMs), neural networks, as well as more recent approaches such as Graph Neural Networks (GNNs). GNNs align well with the graph-based nature of molecular structures, which contributes to their strong predictive performance in various molecular property prediction tasks (<xref ref-type="bibr" rid="B50">Jiang et al., 2021</xref>; <xref ref-type="bibr" rid="B95">Reiser et al., 2022</xref>). In addition, they facilitate the identification of substructures or motifs associated with specific biological effects, thereby enhancing both the accuracy and interpretability of toxicity prediction models (<xref ref-type="bibr" rid="B50">Jiang et al., 2021</xref>; <xref ref-type="bibr" rid="B95">Reiser et al., 2022</xref>; <xref ref-type="bibr" rid="B123">Wu Z. X. et al., 2023</xref>). Transformer-based models, originally developed for natural language processing, have also shown strong potential in cheminformatics (<xref ref-type="bibr" rid="B102">Schwaller et al., 2019</xref>; <xref ref-type="bibr" rid="B108">Tibo et al., 2024</xref>).</p>
<p>In the evaluation phase, performance metrics are selected based on the type of prediction task. For classification models, metrics such as accuracy, precision, recall, F1-score, and area under ROC curve (AUROC) are used to evaluate the model&#x2019;s ability to correctly distinguish toxic from non-toxic compounds. For regression models that predict continuous values like LD<sub>50</sub> or IC<sub>50</sub>, commonly used metrics include MSE, RMSE, MAE, and <italic>R</italic>
<sup>2</sup>. In addition to these quantitative measures, interpretability techniques such as SHAP or attention-based visualizations can provide insights into the features driving model predictions, supporting both model validation and decision-making in drug development (<xref ref-type="bibr" rid="B99">Rodr&#xed;guez-P&#xe9;rez and Bajorath, 2020</xref>; <xref ref-type="bibr" rid="B116">Wang Y. M. et al., 2023</xref>).</p>
<p>Driven by the growing need for early toxicity screening, advances in AI model architectures, and the emergence of robust development frameworks, a number of AI-based toxicity prediction models have recently been proposed. These models vary in scope and specificity, often categorized based on the target organ or the type of assay data used for training. This review summarizes representative toxicity prediction models that cover a broad range of toxicological endpoints. In particular, it focuses on models developed for ADMET profiling, hepatotoxicity, cardiotoxicity, neurotoxicity, and mutagenicity/genotoxicity prediction. Each category reflects distinct biological concerns and methodological approaches. Model development within these domains has evolved in response to challenges such as data scarcity, protocol heterogeneity, and class imbalance (<xref ref-type="bibr" rid="B14">Cavasotto and Scardino, 2022</xref>; <xref ref-type="bibr" rid="B70">Liu et al., 2023</xref>). To address these issues, various strategies have been employed, including multi-task learning, multimodal integration, and active learning. These strategies are discussed in more detail in later sections. In addition, scaffold-based data splitting is also commonly used to evaluate model generalizability across novel chemical structures while minimizing data leakage. In summarizing these models, this review also highlights differences in data sources, input representations, model architectures, and evaluation strategies and interpretability techniques used across toxicity endpoints. These aspects reflect how AI models are tailored to meet the distinct challenges of each toxicological domain.</p>
</sec>
<sec id="s2">
<title>2 Benchmark datasets</title>
<p>A wide range of publicly available datasets have been developed to support toxicity prediction using machine learning and deep learning approaches (<xref ref-type="table" rid="T1">Table 1</xref>). Among the most widely used is Tox21, which comprises qualitative toxicity measurements of 8,249 compounds across 12 biological targets, primarily focused on nuclear receptor and stress response pathways (<xref ref-type="bibr" rid="B97">Richard et al., 2021</xref>). A related resource, ToxCast provides high-throughput screening data for approximately 4,746 chemicals tested across hundreds of biological endpoints, offering broad mechanistic coverage for <italic>in vitro</italic> toxicity profiling (<xref ref-type="bibr" rid="B98">Richard et al., 2016</xref>). These datasets are frequently employed as benchmarks for evaluating classification models in predictive toxicology.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Summary of publicly available benchmark datasets for toxicity prediction.</p>
</caption>
<table>
<thead valign="top">
<tr style="background-color:#D9D9D9">
<th align="left">Dataset Name</th>
<th align="left">Task Type</th>
<th align="left">Description</th>
<th align="left">Ref.</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Tox21SL</td>
<td align="left">Binary Classification</td>
<td align="left">Predicts toxicity across 12 biological targets using qualitative measurements (based on the EPA CompTox Dashboard)</td>
<td align="left">
<xref ref-type="bibr" rid="B97">Richard et al. (2021)</xref>
</td>
</tr>
<tr>
<td align="left">ToxCast</td>
<td align="left">Binary Classification</td>
<td align="left">Provides high-throughput screening (HTS) data across hundreds of assays to evaluate the potential toxicity of chemicals (based on the EPA CompTox Dashboard)</td>
<td align="left">
<xref ref-type="bibr" rid="B98">Richard et al. (2016)</xref>
</td>
</tr>
<tr>
<td align="left">ClinTox</td>
<td align="left">Binary Classification</td>
<td align="left">Predicts clinical trial toxicity outcomes, distinguishing between approved and failed drugs</td>
<td align="left">
<xref ref-type="bibr" rid="B36">Gayvert et al. (2016)</xref>
</td>
</tr>
<tr>
<td align="left">hERG (<xref ref-type="bibr" rid="B51">Karim et al., 2021</xref>)</td>
<td align="left">Binary Classification</td>
<td align="left">Integrated dataset predicting hERG channel blockade (&#x3c;10&#xa0;&#xb5;M) or not (&#x2265;10&#xa0;&#xb5;M)</td>
<td align="left">
<xref ref-type="bibr" rid="B51">Karim et al. (2021)</xref>
</td>
</tr>
<tr>
<td align="left">hERG blockers</td>
<td align="left">Binary Classification</td>
<td align="left">Predicts if a compound blocks the hERG channel, which is crucial for heart rhythm</td>
<td align="left">
<xref ref-type="bibr" rid="B114">Wang et al. (2016)</xref>
</td>
</tr>
<tr>
<td align="left">hERG Central</td>
<td align="left">Binary &#x26; Regression</td>
<td align="left">Provides multiple assays: hERG_at_1uM, hERG_at_10uM (regression), and hERG_inhib (classification)</td>
<td align="left">
<xref ref-type="bibr" rid="B27">Du et al. (2011)</xref>
</td>
</tr>
<tr>
<td align="left">DILIrank</td>
<td align="left">Binary Classification</td>
<td align="left">Predicts drug-induced liver injury, a common cause of drug withdrawal</td>
<td align="left">
<xref ref-type="bibr" rid="B19">Chen et al. (2016)</xref>
</td>
</tr>
<tr>
<td align="left">SIDER</td>
<td align="left">Multi-label</td>
<td align="left">Predicts clinical adverse drug reactions associated with marketed drugs</td>
<td align="left">
<xref ref-type="bibr" rid="B60">Kuhn et al. (2016)</xref>
</td>
</tr>
<tr>
<td align="left">Skin Reaction</td>
<td align="left">Binary Classification</td>
<td align="left">Predicts if a compound can cause skin sensitization reactions</td>
<td align="left">
<xref ref-type="bibr" rid="B3">Alves et al. (2015)</xref>
</td>
</tr>
<tr>
<td align="left">AMES (<xref ref-type="bibr" rid="B124">Xu et al., 2012</xref>)</td>
<td align="left">Binary Classification</td>
<td align="left">Predicts mutagenicity based on the Ames test, indicating potential genetic alterations</td>
<td align="left">
<xref ref-type="bibr" rid="B124">Xu et al. (2012)</xref>
</td>
</tr>
<tr>
<td align="left">Carcinogens (<xref ref-type="bibr" rid="B61">Lagunin et al., 2009</xref>)</td>
<td align="left">Binary Classification</td>
<td align="left">Predicts if a compound is carcinogenic</td>
<td align="left">
<xref ref-type="bibr" rid="B61">Lagunin et al. (2009)</xref>
</td>
</tr>
<tr>
<td align="left">LD50 (<xref ref-type="bibr" rid="B140">Zhu et al., 2009</xref>)</td>
<td align="left">Regression</td>
<td align="left">Predicts acute toxicity (LD50) values, indicating lethal dose levels</td>
<td align="left">
<xref ref-type="bibr" rid="B140">Zhu et al. (2009)</xref>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>To assess clinical toxicity risks, the ClinTox dataset offers labeled data differentiating compounds that were approved by regulatory agencies from those that failed in clinical trials due to toxicity (<xref ref-type="bibr" rid="B36">Gayvert et al., 2016</xref>). Several datasets have been curated for evaluating cardiotoxicity associated with the human Ether-&#xe0;-go-go&#x2013;related gene (hERG) channel blockade. The hERG dataset (<xref ref-type="bibr" rid="B114">Wang et al., 2016</xref>; <xref ref-type="bibr" rid="B51">Karim et al., 2021</xref>) includes over 13,000 compounds annotated with binary labels based on a 10&#xa0;&#xb5;M inhibition threshold, while the hERG blockers dataset provides a smaller set of 648 compounds (<xref ref-type="bibr" rid="B114">Wang et al., 2016</xref>; <xref ref-type="bibr" rid="B51">Karim et al., 2021</xref>). A more extensive resource, hERG Central, encompasses over 300,000 experimental records and supports both classification and regression tasks based on various hERG inhibition assays (<xref ref-type="bibr" rid="B27">Du et al., 2011</xref>). Liver toxicity is addressed in the DILIrank (Drug-Induced Liver Injury) dataset, which contains 475 compounds annotated for their hepatotoxic potential, an important factor in post-market drug withdrawals (<xref ref-type="bibr" rid="B128">Xu et al., 2015</xref>). The SIDER dataset presents multi-label side effect annotations for more than 1,400 marketed drugs, enabling the prediction of clinically observed adverse drug reactions (<xref ref-type="bibr" rid="B60">Kuhn et al., 2016</xref>). For dermatological toxicity, the Skin Reaction dataset includes 404 compounds evaluated for their potential to cause skin sensitization (<xref ref-type="bibr" rid="B3">Alves et al., 2015</xref>). Genotoxicity is commonly assessed using the AMES dataset, which comprises 7,255 compounds labeled based on the Ames test&#x2014;a standard assay for detecting mutagenic potential (<xref ref-type="bibr" rid="B124">Xu et al., 2012</xref>). The Carcinogens dataset contains 278 compounds classified as carcinogenic or non-carcinogenic, serving as a benchmark for cancer risk prediction (<xref ref-type="bibr" rid="B61">Lagunin et al., 2009</xref>). Finally, acute systemic toxicity is represented by the LD<sub>50</sub>_Zhu dataset, which includes LD<sub>50</sub> values for 7,385 compounds and supports regression modeling of lethal dose responses (<xref ref-type="bibr" rid="B140">Zhu et al., 2009</xref>). Collectively, these datasets span a broad range of toxicological endpoints and data modalities and have become foundational resources for the development, validation, and comparison of AI-driven toxicity prediction models.</p>
<p>At the same time, their widespread adoption has revealed several practical challenges that impact real-world applications. For instance, data scarcity in certain toxicity endpoints can hinder the performance of machine learning models that depend on sufficient training data. In some cases, limited data may fail to represent diverse chemical scaffolds, reducing model generalizability. When class imbalance is also present, such as a higher proportion of non-toxic compounds, the effects of data scarcity can be further amplified (<xref ref-type="bibr" rid="B14">Cavasotto and Scardino, 2022</xref>). Since toxicity labels are typically derived from experimental measurements, inconsistencies across assay protocols often lead to a lack of data uniformity. This protocol heterogeneity can make it difficult to merge datasets from different sources. Furthermore, annotation noise resulting from experimental variability or ambiguous labeling can introduce additional challenges during model training (<xref ref-type="bibr" rid="B70">Liu et al., 2023</xref>).</p>
<p>To overcome these issues, expanding datasets through newly generated experimental data and literature-based curation can help improve coverage and diversity. In parallel, standardizing toxicity testing protocols and documentation practices may enhance data consistency and interoperability. These efforts are expected to contribute meaningfully to the development of more robust and reliable AI-based toxicity prediction models in drug discovery.</p>
</sec>
<sec id="s3">
<title>3 Computational models for ADMET and toxicity prediction</title>
<p>Several publicly accessible ADMET prediction tools, including ADMETLab 3.0, Deep-PK, ProTox 3.0, Helix-ADMET, FP-ADMET, and admetSAR 2.0 (<xref ref-type="bibr" rid="B130">Yang et al., 2019</xref>; <xref ref-type="bibr" rid="B111">Venkatraman, 2021</xref>; <xref ref-type="bibr" rid="B136">Zhang et al., 2022</xref>; <xref ref-type="bibr" rid="B7">Banerjee et al., 2024</xref>; <xref ref-type="bibr" rid="B33">Fu et al., 2024</xref>; <xref ref-type="bibr" rid="B83">Myung et al., 2024</xref>), provide a wide array of toxicity prediction models, each differing in scope, algorithmic strategy, and coverage. ADMETLab 3.0 offers predictive models for 119 endpoints, including toxicity-related properties such as hERG inhibition, carcinogenicity, and respiratory toxicity. These models are built using directed message-passing neural networks (DMPNNs) and incorporate uncertainty estimation features. The toxicity models, such as the one for hERG inhibition, have demonstrated strong performance with AUROC values approaching 0.94. In terms of interpretability, ADMETLab 3.0 provides uncertainty scores alongside predictions, uses colored indicators to represent empirical decision states, and highlights structural alerts contributing to toxicity (<xref ref-type="bibr" rid="B33">Fu et al., 2024</xref>). Deep-PK is a deep learning&#x2013;based framework that predicts 73 endpoints, including 35 toxicity-related endpoints, 29 other ADMET properties, and 9 general molecular descriptors. While its primary focus lies in pharmacokinetic regression tasks and ADMET optimization, it offers comprehensive support for toxicity assessment through GNN-based pipelines that accept SMILES, SDF, and molecular descriptor inputs. The model also provides interpretability by identifying key molecular subgraphs that contribute to prediction outcomes (<xref ref-type="bibr" rid="B83">Myung et al., 2024</xref>). ProTox 3.0 is particularly comprehensive in its treatment of toxicity, providing 61 predictive models covering a broad spectrum of endpoints. These include organ-specific toxicities such as hepatotoxicity, neurotoxicity, cardiotoxicity, and nephrotoxicity, along with models for clinical, immunological, and nutritional toxicities. The platform integrates mechanistic insights through AOPs, molecular initiating events, and target-specific toxicities, and supports ontology-driven, systems-level interpretation (<xref ref-type="bibr" rid="B7">Banerjee et al., 2024</xref>). Helix-ADMET is a flexible ADMET prediction platform that combines self-supervised and multi-task learning to enhance generalizability across diverse chemical scaffolds. It supports fine-tuning on user-defined endpoints and classifies toxicity into macro- and micro-level categories (<xref ref-type="bibr" rid="B136">Zhang et al., 2022</xref>). FP-ADMET is an open-source tool that focuses on over 50 ADMET-related endpoints, including drug-induced liver injury, hERG inhibition, hemolytic toxicity, mitochondrial toxicity, and cell-specific cytotoxicity. The models are constructed using random forest classifiers trained on 20 different types of chemical fingerprints, enabling broad chemical space coverage and compound exploration (<xref ref-type="bibr" rid="B111">Venkatraman, 2021</xref>). admetSAR 2.0 provides 47 curated endpoints, including Ames mutagenicity, carcinogenicity, immunotoxicity, and hERG inhibition. It employs traditional machine learning algorithms such as random forest, SVM, and k-nearest neighbors (KNNs) applied to molecular descriptors and fingerprints (<xref ref-type="bibr" rid="B130">Yang et al., 2019</xref>).</p>
<p>The comprehensiveness of these tools not only facilitates broad ADMET screening but also enables prioritization of drug candidates with favorable safety profiles. The development of such general-purpose prediction tools has been largely driven by advances in molecular representations that effectively capture compound features, along with the availability of benchmark datasets annotated with a wide range of ADMET endpoints. On the other hand, tools that focus on specific toxicity types such as hepatotoxicity, cardiotoxicity, nephrotoxicity, neurotoxicity, and genotoxicity/carcinogenicity often require task-specific datasets and tailored feature engineering strategies to enhance predictive performance. The following sections introduce these organ- and mechanism-specific toxicity models and discuss how specialized data and domain-informed approaches contribute to their effectiveness.</p>
</sec>
<sec id="s4">
<title>4 Endpoint-specific toxicity prediction</title>
<p>Each endpoint is characterized by differences in data properties, sources including databases, and overall data volume. Furthermore, depending on the specific toxicity pathways involved, areas of interest such as the level of interpretability required can also vary. As a result, models for each endpoint have been designed to reflect these unique characteristics, leading to differences in the features used and the methodological approaches adopted (<xref ref-type="fig" rid="F2">Figure 2</xref> and <xref ref-type="table" rid="T2">Table 2</xref>). While many of these models share a common foundation in molecular data, it is important to note that the choice of features and modeling techniques is often tailored to the distinct goals and nature of each endpoint.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Representative toxicity endpoints categorized into six major classes.</p>
</caption>
<graphic xlink:href="fchem-13-1632046-g002.tif">
<alt-text content-type="machine-generated">Chart with six sections detailing types of drug-induced toxicity: ADMET, Hepatotoxicity, Cardiotoxicity, Nephrotoxicity, Neurotoxicity, and Genotoxicity. Each section lists specific tests and effects, such as LD50, cytotoxicity, and liver enzyme elevation.</alt-text>
</graphic>
</fig>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Summary comparison table across different toxicity endpoints.</p>
</caption>
<table>
<thead valign="top">
<tr style="background-color:#D9D9D9">
<th align="left">Endpoint</th>
<th align="left">Data</th>
<th align="left">Feature<xref ref-type="table-fn" rid="Tfn1">
<sup>a</sup>
</xref>
</th>
<th align="left">Methods<xref ref-type="table-fn" rid="Tfn1">
<sup>a</sup>
</xref>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Hepatotoxicity</td>
<td align="left">DILIrank (<xref ref-type="bibr" rid="B19">Chen et al., 2016</xref>)<break/>DILIst (<xref ref-type="bibr" rid="B107">Thakkar et al., 2020</xref>)<break/>LiverTox (<xref ref-type="bibr" rid="B45">Hoofnagle et al., 2013</xref>), Hepatox (<xref ref-type="bibr" rid="B92">Quinton et al., 1993</xref>)<break/>Proxy-DILI (<xref ref-type="bibr" rid="B81">Mulliner et al., 2016</xref>)<break/>SIDER (<xref ref-type="bibr" rid="B60">Kuhn et al., 2016</xref>)<break/>LTKB (<xref ref-type="bibr" rid="B20">Chen et al., 2011</xref>)<break/>
<xref ref-type="bibr" rid="B40">Greene et al. (2010)</xref>
<break/>
<xref ref-type="bibr" rid="B126">Xu et al. (2008)</xref>
<break/>
<xref ref-type="bibr" rid="B69">Liew et al. (2011)</xref>
<break/>
<xref ref-type="bibr" rid="B129">Yan et al. (2022)</xref>
</td>
<td align="left">Molecular structure<break/>&#x2003;- Molecular graph<break/>&#x2003;- Molecule image<break/>&#x2003;- Molecular fingerprints (e.g., ECFP, MACCS keys)<break/>Descriptors<break/>&#x2003;- Molecular descriptors (e.g., PaDEL)<break/>&#x2003;- Physicochemical descriptors<break/>Task-specific or specialized features<break/>&#x2003;- Predicted PK parameters<break/>&#x2003;- Predicted Proxy-DILI labels</td>
<td align="left">Deep learning models<break/>&#x2003;- GeoGNN &#x2b; ResNet<break/>&#x2003;- ResNet<break/>&#x2003;- Fully connected neural network (FCNN)<break/>Tree-based Models<break/>- Random forest<break/>- Light gradient boosting machine (LGBM)<break/>- Decision trees<break/>Bayesian models<break/>- Bayesian network</td>
</tr>
<tr>
<td align="left">Cardiotoxicity</td>
<td align="left">ChEMBL (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>), BindingDB (<xref ref-type="bibr" rid="B73">Liu et al., 2007</xref>)<break/>PubChem (<xref ref-type="bibr" rid="B53">Kim et al., 2016</xref>)<break/>
<xref ref-type="bibr" rid="B24">Didziapetris and Lanevskij (2016)</xref>
<break/>
<xref ref-type="bibr" rid="B114">Wang et al. (2016)</xref>
<break/>
<xref ref-type="bibr" rid="B72">Liu et al. (2020)</xref>
<break/>
<xref ref-type="bibr" rid="B66">Li et al. (2008)</xref>
<break/>
<xref ref-type="bibr" rid="B82">Munawar et al. (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B84">Negami et al. (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B62">Lanevskij et al. (2022)</xref>
<break/>
<xref ref-type="bibr" rid="B100">Ryu et al. (2020)</xref>
<break/>
<xref ref-type="bibr" rid="B51">Karim et al. (2021)</xref>
<break/>
<xref ref-type="bibr" rid="B137">Zhang Y. M. et al. (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B52">Kim et al. (2022)</xref>
<break/>
<xref ref-type="bibr" rid="B55">Konda and Kristam (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B13">Cai et al. (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B26">Doddareddy et al. (2010)</xref>
</td>
<td align="left">Molecular structure<break/>&#x2003;- Molecular fingerprints<break/>&#x2003;- AtomPairs2DFingerprintCount (APC2D)<break/>&#x2003;- SMILES embedding vector<break/>Descriptors<break/>&#x2003;- Molecular descriptors (Mordred, AlvaDesc)<break/>&#x2003;- 2D &#x2b; 3D descriptors (Mordred)</td>
<td align="left">Deep learning models<break/>&#x2003;- GNN (Attentive FP)<break/>&#x2003;- Graph attention networks (GAT) &#x2b; Gated recurrent units (GRU)<break/>&#x2003;- GAT<break/>&#x2003;- FCNN<break/>&#x2003;- GCN<break/>&#x2003;- Meta-ensemble model combining GCN, FCNN, and 1D&#x2003;- Convolutional neural network (CNN)<break/>Tree-based Models<break/>- XGBoost</td>
</tr>
<tr>
<td align="left">Renal/nephrotoxicity</td>
<td align="left">SIDER (<xref ref-type="bibr" rid="B60">Kuhn et al., 2016</xref>)<break/>DrugBank (<xref ref-type="bibr" rid="B120">Wishart et al., 2018</xref>)<break/>ChEMBL (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>)<break/>PubChem (<xref ref-type="bibr" rid="B53">Kim et al., 2016</xref>)<break/>TCM (<xref ref-type="bibr" rid="B16">Chen, 2011</xref>)<break/>ChemIDplus</td>
<td align="left">Molecular structure<break/>&#x2003;- Molecular fingerprints (Morgan, EstateFP, CDK FP, CDK extended FP, CDK graph&#x2003;-only FP, Klekota&#x2013;Roth FP, MACCS keys, PubChem FP, Substructure FP)<break/>- APC2D<break/>- Fragmentor<break/>- SMILES embedding vector<break/>Descriptors<break/>- Molecular descriptors (Chemaxon, Mordred, RDKit, QNPR, alvaDesc, PyDescriptor, GSFrag)</td>
<td align="left">Deep learning models<break/>&#x2003;- CNN<break/>&#x2003;- FCNN<break/>Tree-based models<break/>&#x2003;- Random forest<break/>&#x2003;- LGBM<break/>&#x2003;- XGBoost<break/>SVM<break/>Ensemble/hybrid models<break/>&#x2003;- Combination of genetic algorithm and Na&#xef;ve Bayes classifier<break/>- Consensus model of random forest, XGBoost, and CNN</td>
</tr>
<tr>
<td align="left">Neurotoxicity</td>
<td align="left">PubChem (<xref ref-type="bibr" rid="B53">Kim et al., 2016</xref>)<break/>ChEMBL database (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>)<break/>U.S. EPA dataset (<xref ref-type="bibr" rid="B2">Albert, 1994</xref>)<break/>SIDER (<xref ref-type="bibr" rid="B60">Kuhn et al., 2016</xref>)<break/>
<xref ref-type="bibr" rid="B71">Liu et al. (2021)</xref>
<break/>
<xref ref-type="bibr" rid="B79">Mazumdar et al. (2023)</xref>
<break/>
<xref ref-type="bibr" rid="B106">Tang et al. (2022)</xref>
<break/>
<xref ref-type="bibr" rid="B105">Storchi et al. (2023)</xref>
<break/>ChemIDplus</td>
<td align="left">Molecular structure<break/>&#x2003;- Molecular graph<break/>&#x2003;- SMILES embedding<break/>&#x2003;- Molecular fingerprints (e.g., ECFP, MACCS keys, PubChem FP, substructure FP, Klekota&#x2013;Roth FP, Estate FP, CDK FP, CDK ECFP)<break/>Descriptors<break/>- Molecular descriptors (e.g., PaDEL, CDK, Dragon descriptors)<break/>Task-specific or specialized features<break/>- MIE predictions</td>
<td align="left">Deep learning models<break/>&#x2003;- DMPNN<break/>&#x2003;- MFBERT<break/>&#x2003;- MLP&#x2003;-NNET<break/>Tree-based Models<break/>&#x2003;- Random forest<break/>&#x2003;- Extra&#x2003;-trees regressor<break/>&#x2003;- C4.5 decision tree<break/>SVM<break/>kNN<break/>Na&#xef;ve Bayes</td>
</tr>
<tr>
<td align="left">Genotoxicity/Carcinogenicity</td>
<td align="left">TOXRIC (<xref ref-type="bibr" rid="B122">Wu W. X. et al., 2023</xref>)<break/>Li&#x2019;s dataset (<xref ref-type="bibr" rid="B68">Li T. et al., 2021</xref>)<break/>
<xref ref-type="bibr" rid="B124">Xu et al. (2012)</xref>
<break/>
<xref ref-type="bibr" rid="B42">Hansen et al. (2009)</xref>
<break/>
<xref ref-type="bibr" rid="B10">Benigni et al. (2013)</xref>
<break/>
<xref ref-type="bibr" rid="B25">Dimitrov et al. (2016)</xref>
<break/>CPDB (<xref ref-type="bibr" rid="B38">Gold et al., 2005</xref>)<break/>CCRIS database, ISSCAN (<xref ref-type="bibr" rid="B11">Benigni et al., 2008</xref>)</td>
<td align="left">Molecular structure<break/>&#x2003;- Molecular fingerprints (e.g., ECFP2, ECFP4, ECFP6, MACCS keys, PubChem FP, CDK FP, CDK extended FP, Klekota&#x2013;Roth FP, AP2D, AP2DC, Estate FP, FP4, FP4C)<break/>- Mol2vec<break/>Descriptors<break/>- Molecular descriptors (e.g., RDKit2D, computed molecular descriptors)<break/>Task-specific or specialized features<break/>&#x2003;- Structural alerts</td>
<td align="left">Deep Learning Models<break/>&#x2003;- 2D-CNN with active learning<break/>&#x2003;- Capsule network with self&#x2003;-attention routing<break/>- Multitask DNN<break/>Tree-based Models<break/>- Extremely randomized trees<break/>SVM<break/>Ensemble/hybrid models<break/>- Consensus model (averaging)<break/>- Recursive molecular similarity &#x2b; extremely randomized trees</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn1">
<label>
<sup>a</sup>
</label>
<p>Features and methods refer to those used in the reviewed models; additional options may be applicable.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>In hepatotoxicity prediction, physicochemical properties of molecules are known to be influential and are often incorporated into models (<xref ref-type="bibr" rid="B17">Chen et al., 2013a</xref>; <xref ref-type="bibr" rid="B57">Kotsampasakou and Ecker, 2017</xref>; <xref ref-type="bibr" rid="B64">Lee and Yoo, 2024</xref>). Both deep learning and tree-based methods have been used with comparable frequency. For cardiotoxicity, particularly related to hERG channel blockade, the availability of larger datasets has encouraged the use of more data-intensive deep learning approaches. GNNs are frequently applied due to their structural compatibility with molecules and their ability to offer interpretability through substructure-level attention (<xref ref-type="bibr" rid="B50">Jiang et al., 2021</xref>; <xref ref-type="bibr" rid="B132">Yang et al., 2024</xref>; <xref ref-type="bibr" rid="B63">Lee and Yoo, 2025</xref>). In renal or nephrotoxicity prediction, traditional machine learning models are more commonly used, as they tend to perform better than deep learning when data are limited (<xref ref-type="bibr" rid="B127">Xu et al., 2023</xref>). In neurotoxicity studies, a single study may develop multiple models to address distinct tasks such as BBB permeability, neuronal cytotoxicity, neural activity interference, and general neurotoxicity, enabling broader predictive coverage (<xref ref-type="bibr" rid="B88">Pang et al., 2025</xref>). For genotoxicity and carcinogenicity, multi-task learning has been applied to predict outcomes across several Ames test strains within a single model. This approach outperformed single-task models by leveraging shared parameters across tasks (<xref ref-type="bibr" rid="B77">Mart&#xed;nez et al., 2022</xref>). These variations, driven by endpoint-specific requirements, are elaborated in the subsequent sections.</p>
<sec id="s4-1">
<title>4.1 Hepatotoxicity</title>
<p>The physiological functions of the liver, a fundamental organ in maintaining systemic homeostasis, include detoxification, plasma protein synthesis, regulation of lipid and glucose metabolism, bile production, and immune modulation (<xref ref-type="bibr" rid="B41">Gu and Manautou, 2012</xref>). While the liver&#x2019;s metabolic processes can render many chemicals less toxic, it has the potential to enhance their toxicity as well, thereby exerting a detrimental effect on the liver (<xref ref-type="bibr" rid="B41">Gu and Manautou, 2012</xref>). Pathologies of the liver, such as hepatic steatosis and fibrosis, can adversely impact the metabolism of nutrients, endocrine substances and pharmaceuticals resulting in pronounced systemic implications for overall physiological homeostasis (<xref ref-type="bibr" rid="B31">Foulds et al., 2017</xref>; <xref ref-type="bibr" rid="B43">Heeren and Scheja, 2021</xref>). Due to its multifaceted physiological roles and vulnerability to chemical-induced damage, the liver frequently experiences drug toxicity. Consequently, it becomes imperative to accurately assess the hepatotoxicity of drugs, commonly referred to as drug-induced liver injury (DILI), an area of active research (<xref ref-type="bibr" rid="B94">Regev, 2014</xref>). Both <italic>in vitro</italic> and <italic>in vivo</italic> methods are employed to evaluate the hepatotoxicity of drugs, although these approaches can be laborious and costly (<xref ref-type="bibr" rid="B1">Ai et al., 2018</xref>; <xref ref-type="bibr" rid="B113">Walker et al., 2020</xref>). Moreover, the level of agreement between liver toxicity in animals and humans averages approximately 55% (<xref ref-type="bibr" rid="B6">Babai et al., 2021</xref>). Consequently, there exists a demand for predictive models that can foresee liver toxicity and help mitigate development risk and late-stage failure.</p>
<p>Various machine learning approaches have been proposed to address the limitations of traditional DILI assessment, particularly in terms of scalability and interpretability (<xref ref-type="table" rid="T3">Table 3</xref>). InterDILI focused on enhancing interpretability by employing permutation feature importance and attention mechanisms to identify both general and compound-specific substructures and physicochemical properties contributing to DILI, using five publicly available datasets and multiple machine learning algorithms (<xref ref-type="bibr" rid="B64">Lee and Yoo, 2024</xref>). DILIPredictor employed a two-stage modeling approach by integrating proxy-DILI labels with chemical structure features. By identifying the most contributing MACCS substructures to DILI toxicity, it further provided insights into species-specific hepatotoxicity and mechanistic causes through substructure interpretation. The model also provides a web interface for easy access to DILI predictions and their interpretation without the need for local installation (<xref ref-type="bibr" rid="B23">Seal et al., 2024</xref>). GeoDILI introduced an interpretable graph neural network that leverages 3D molecular geometry and gradient-based attribution to identify atom-level toxicophores, addressing the lack of geometric and mechanistic considerations in previous models (<xref ref-type="bibr" rid="B122">Wu W. X. et al., 2023</xref>). It encodes molecular structures using a fine-tuned geometry-based GNN (GeoGNN), with the resulting vector passed through a ResNet for binary DILI classification. Notably, it applies to a rare attention-free interpretation method for GNNs, offering an alternative to attention-based approaches. OvA-QSTR utilized a one-vs-all classification strategy based on PaDEL-derived molecular descriptors and feature selection via correlation heatmaps, aiming to isolate DILI-related features with statistical clarity (<xref ref-type="bibr" rid="B15">Celik and Karaduman, 2023</xref>). The model proposed by Rao et al. predicted DILI severity by integrating physicochemical descriptors with off-target profiles, highlighting the importance of drug-target interactions and promiscuity in distinguishing between different levels of hepatotoxicity (<xref ref-type="bibr" rid="B93">Rao et al., 2023</xref>). Lastly, ResNet18DNN converted SMILES codes into molecular images and applied deep neural networks to learn abstract chemical features from visual input, offering a novel image-based perspective in DILI prediction (<xref ref-type="bibr" rid="B21">Chen et al., 2022</xref>).</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Summary of recently published prediction tools of DILI.</p>
</caption>
<table>
<thead valign="top">
<tr style="background-color:#D9D9D9">
<th align="left">Approach</th>
<th align="left">Year</th>
<th align="left">Dataset</th>
<th align="left">Features</th>
<th align="left">Algorithm</th>
<th align="left">Performance</th>
<th align="left">Ref.</th>
<th align="left">Availability</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">InterDILI</td>
<td align="left">2024</td>
<td align="left">FDA NCTR (<xref ref-type="bibr" rid="B18">Chen et al., 2013b</xref>)<break/>
<xref ref-type="bibr" rid="B40">Greene et al. (2010)</xref>
<break/>
<xref ref-type="bibr" rid="B126">Xu et al. (2008)</xref>
<break/>
<xref ref-type="bibr" rid="B69">Liew et al. (2011)</xref>
<break/>DILIrank (<xref ref-type="bibr" rid="B19">Chen et al., 2016</xref>)</td>
<td align="left">Morgan fingerprints,<break/>Physicochemical descriptors (RDKit)</td>
<td align="left">Random forest,<break/>LGBM,<break/>Logistic regression (LR),<break/>FCNN</td>
<td align="left">DILI prediction [Hold-out]<break/>- AUROC: 0.97<break/>- AUPRC: 0.95<break/>- ACC: 0.90 <break/>[10-fold CV]<break/>- AUROC: 0.87<break/>- ACC: 0.78<break/>- AUPRC: 0.87</td>
<td align="left">
<xref ref-type="bibr" rid="B64">Lee and Yoo (2024)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://github.com/bmil-jnu/InterDILI">https://github.com/bmil-jnu/InterDILI</ext-link>
</td>
</tr>
<tr>
<td align="left">DILI Predictor</td>
<td align="left">2024</td>
<td align="left">DILIst (<xref ref-type="bibr" rid="B107">Thakkar et al., 2020</xref>)<break/>DILIrank (<xref ref-type="bibr" rid="B19">Chen et al., 2016</xref>)<break/>Proxy-DILI (<xref ref-type="bibr" rid="B81">Mulliner et al., 2016</xref>)</td>
<td align="left">Morgan fingerprints,<break/>MACCS keys,<break/>Physicochemical descriptors (RDKit),<break/>Predicted PK parameters,<break/>Predicted proxy-DILI labels</td>
<td align="left">Random forest</td>
<td align="left">DILI prediction<break/>- AUROC: 0.63<break/>- LR<sup>&#x2b;</sup>: 1.40</td>
<td align="left">
<xref ref-type="bibr" rid="B23">Seal et al. (2024)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://dili.serve.scilifelab.se/">https://dili.serve.scilifelab.se/</ext-link>
<break/>
<ext-link ext-link-type="uri" xlink:href="https://github.com/srijitseal/DILI_Predictor?tab=readme-ov-file">https://github.com/srijitseal/DILI_Predictor?tab&#x3d;readme-ov-file</ext-link>
</td>
</tr>
<tr>
<td align="left">GeoDILI</td>
<td align="left">2023</td>
<td align="left">DILIst (<xref ref-type="bibr" rid="B107">Thakkar et al., 2020</xref>)<break/>DILIrank (<xref ref-type="bibr" rid="B19">Chen et al., 2016</xref>)<break/>
<xref ref-type="bibr" rid="B129">Yan et al. (2022)</xref>
</td>
<td align="left">Molecular graph</td>
<td align="left">GeoGNN &#x2b; ResNet</td>
<td align="left">DILI prediction<break/>- AUROC: 0.908<break/>- ACC: 0.975<break/>- F1-score: 0.905<break/>- MCC: 0.732</td>
<td align="left">
<xref ref-type="bibr" rid="B122">Wu W. X. et al. (2023)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://github.com/CSU-QJY/GeoDILI">https://github.com/CSU-QJY/GeoDILI</ext-link>
</td>
</tr>
<tr>
<td align="left">OvA-QSTR</td>
<td align="left">2023</td>
<td align="left">LiverTox (<xref ref-type="bibr" rid="B45">Hoofnagle et al., 2013</xref>), PubChem (<xref ref-type="bibr" rid="B53">Kim et al., 2016</xref>)</td>
<td align="left">Molecular descriptors (PaDEL)</td>
<td align="left">Bayesian network, Decision trees,<break/>Random forest</td>
<td align="left">DILI prediction<break/>BayesNet<break/>- AUPRC: 0.718 to 0.869</td>
<td align="left">
<xref ref-type="bibr" rid="B15">Celik and Karaduman (2023)</xref>
</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Rao et al.</td>
<td align="left">2023</td>
<td align="left">DILIrank (<xref ref-type="bibr" rid="B19">Chen et al., 2016</xref>)</td>
<td align="left">Physicochemical descriptors (RDKit &#x2b; QikProp)</td>
<td align="left">Random forest, SVM, FCNN, LR</td>
<td align="left">DILI prediction<break/>- AUROC: 0.88<break/>- Sensitivity: 0.73<break/>- Specificity: 0.9</td>
<td align="left">
<xref ref-type="bibr" rid="B93">Rao et al. (2023)</xref>
</td>
<td align="left"/>
</tr>
<tr>
<td align="left">ResNet18DNN</td>
<td align="left">2022</td>
<td align="left">DILIrank (<xref ref-type="bibr" rid="B19">Chen et al., 2016</xref>), LiverTox (<xref ref-type="bibr" rid="B45">Hoofnagle et al., 2013</xref>), Hepatox (<xref ref-type="bibr" rid="B92">Quinton et al., 1993</xref>)<break/>SIDER (<xref ref-type="bibr" rid="B60">Kuhn et al., 2016</xref>), LTKB (<xref ref-type="bibr" rid="B20">Chen et al., 2011</xref>), Literature (<xref ref-type="bibr" rid="B18">Chen et al., 2013b</xref>; <xref ref-type="bibr" rid="B128">Xu et al., 2015</xref>)</td>
<td align="left">Smiles converted in images by RDKit</td>
<td align="left">ResNet</td>
<td align="left">DILI prediction<break/>- AUROC: 0.958</td>
<td align="left">
<xref ref-type="bibr" rid="B21">Chen et al. (2022)</xref>
</td>
<td align="left"/>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s4-2">
<title>4.2 Cardiotoxicity prediction</title>
<p>Cardiotoxicity is a major concern in drug development, often leading to late-stage failures or market withdrawals. Compounds posing cardiovascular risks have been withdrawn, while others face increasing regulatory scrutiny, underscoring the need for early risk assessment strategies. An illustrative case involves Janus kinase (JAK) inhibitors, namely, tofacitinib, baricitinib, and upadacitinib, used to treat rheumatoid arthritis. In 2021, the U.S. FDA issued a boxed warning for these agents due to elevated risks of cardiovascular events, malignancies, thrombosis, and mortality (<xref ref-type="bibr" rid="B58">Kragstrup et al., 2022</xref>). Such examples highlight the importance of identifying cardiotoxic compounds early in the drug discovery process. A common mechanism of cardiotoxicity involves QT interval prolongation and ventricular arrhythmias, often resulting from inhibition of the hERG potassium channel, which is critical for cardiac repolarization (<xref ref-type="bibr" rid="B131">Yang et al., 2020</xref>). To mitigate these risks, evaluation of hERG liability is required at the preclinical stage per ICH S7B guidelines (<xref ref-type="bibr" rid="B29">FDA, 2005</xref>), and is increasingly recommended during earlier stages, including lead optimization. Early identification enables structural refinement to avoid cardiotoxicity before costly development steps.</p>
<p>Several recently developed computational tools for cardiotoxicity prediction are summarized in <xref ref-type="table" rid="T4">Table 4</xref>, with a particular focus on assessing hERG channel blockade&#x2014;a critical concern in early drug development. hERGBoost presents a quantitative modeling approach using gradient boosting to predict IC<sub>50</sub> values of potential hERG inhibitors, allowing a more nuanced evaluation of cardiotoxic risk beyond binary classification. Although the model is easily accessible through a web interface, it does not provide interpretability for its predictions (<xref ref-type="bibr" rid="B134">Yu et al., 2025</xref>). The following models, though not web-accessible, are designed to provide interpretability. hERGAT employs a hybrid architecture combining GAT and GRU to capture both atomic-level and molecule-level interactions, enhancing interpretability through attention-based substructure identification (<xref ref-type="bibr" rid="B63">Lee and Yoo, 2025</xref>). AttenhERG incorporates uncertainty estimation within a graph neural network framework, aiming to improve the reliability of predictions and assist compound optimization. It provides interpretability through atom-level attention weight visualizations, highlighting which molecular substructures contribute to hERG inhibition (<xref ref-type="bibr" rid="B132">Yang et al., 2024</xref>). DMFGAM integrates both fingerprint-derived and graph-based features using a SMILES graph attention network and fully connected neural layers, reflecting the advantage of multimodal input representations (<xref ref-type="bibr" rid="B115">Wang T. Y. et al., 2023</xref>). CardioTox Net utilizes a meta-ensemble strategy that merges outputs from multiple deep learning architectures (GCN, FCNN, 1D-CNN), each trained on diverse molecular encodings, to enhance prediction robustness across varying datasets and evaluation criteria (<xref ref-type="bibr" rid="B51">Karim et al., 2021</xref>). Lastly, DeepHIT focuses on minimizing false negatives by training multiple deep neural networks on a large gold-standard dataset, and includes a chemical transformation module for generating safer analogs based on known cardiotoxic compounds (<xref ref-type="bibr" rid="B100">Ryu et al., 2020</xref>).</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Recently published prediction tools of cardiotoxicity.</p>
</caption>
<table>
<thead valign="top">
<tr style="background-color:#D9D9D9">
<th align="left">Approach</th>
<th align="left">Year</th>
<th align="left">Dataset</th>
<th align="left">Features</th>
<th align="left">Algorithm</th>
<th align="left">Performance</th>
<th align="left">Ref.</th>
<th align="left">Availability</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">hERGBoost</td>
<td align="left">2025</td>
<td align="left">ChEMBL (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>)<break/>BindingDB (<xref ref-type="bibr" rid="B73">Liu et al., 2007</xref>)<break/>
<xref ref-type="bibr" rid="B24">Didziapetris and Lanevskij (2016)</xref>
<break/>
<xref ref-type="bibr" rid="B114">Wang et al. (2016)</xref>
<break/>
<xref ref-type="bibr" rid="B72">Liu et al. (2020)</xref>
<break/>
<xref ref-type="bibr" rid="B66">Li et al. (2008)</xref>
<break/>
<xref ref-type="bibr" rid="B82">Munawar et al. (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B84">Negami et al. (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B62">Lanevskij et al. (2022)</xref>
<break/>
<xref ref-type="bibr" rid="B100">Ryu et al. (2020)</xref>
<break/>
<xref ref-type="bibr" rid="B51">Karim et al. (2021)</xref>
</td>
<td align="left">Descriptors (AlvaDesc),<break/>Molecular fingerprints</td>
<td align="left">XGBoost</td>
<td align="left">hERG channel inhibition<break/>[Regression]<break/>- <italic>R</italic>
<sup>2</sup>: 0.622<break/>- RMSE: 0.595<break/>- MAE: 0.383<break/>[Classification]<break/>- ACC: 0.814<break/>- MCC: 0.614</td>
<td align="left">
<xref ref-type="bibr" rid="B134">Yu et al. (2025)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://ssbio.cau.ac.kr/software/hergboost/">http://ssbio.cau.ac.kr/software/hergboost/</ext-link>
</td>
</tr>
<tr>
<td align="left">hERGAT</td>
<td align="left">2025</td>
<td align="left">ChEMBL (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>)<break/>PubChem (<xref ref-type="bibr" rid="B53">Kim et al., 2016</xref>)<break/>
<xref ref-type="bibr" rid="B66">Li et al. (2008)</xref>
<break/>
<xref ref-type="bibr" rid="B114">Wang et al. (2016)</xref>
<break/>
<xref ref-type="bibr" rid="B135">Zhang H. et al. (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B52">Kim et al. (2022)</xref>
</td>
<td align="left">Descriptors,<break/>Molecular fingerprints,<break/>Molecular graph</td>
<td align="left">GAT &#x2b; GRU</td>
<td align="left">hERG channel inhibition<break/>- AUROC: 0.907<break/>- AUPRC: 0.904</td>
<td align="left">
<xref ref-type="bibr" rid="B63">Lee and Yoo (2025)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://github.com/bmil-jnu/hERGAT">https://github.com/bmil-jnu/hERGAT</ext-link>
</td>
</tr>
<tr>
<td align="left">AttenhERG</td>
<td align="left">2024</td>
<td align="left">ChEMBL (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>), PubChem (<xref ref-type="bibr" rid="B53">Kim et al., 2016</xref>), BindingDB (<xref ref-type="bibr" rid="B73">Liu et al., 2007</xref>)<break/>
<xref ref-type="bibr" rid="B52">Kim et al. (2022)</xref>
</td>
<td align="left">Molecular graph</td>
<td align="left">GNN (Attentive FP)</td>
<td align="left">hERG channel inhibition<break/>- AUROC: 0.835<break/>- BAC: 0.767<break/>- MCC: 0.543</td>
<td align="left">
<xref ref-type="bibr" rid="B132">Yang et al. (2024)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://github.com/Tianbiao-Yang/AttenhERG">https://github.com/Tianbiao-Yang/AttenhERG</ext-link>
</td>
</tr>
<tr>
<td align="left">DMFGAM</td>
<td align="left">2023</td>
<td align="left">CHEMBL (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>)<break/>
<xref ref-type="bibr" rid="B72">Liu et al. (2020)</xref>
<break/>
<xref ref-type="bibr" rid="B55">Konda and Kristam (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B82">Munawar et al. (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B84">Negami et al. (2019)</xref>
</td>
<td align="left">Morgan fingerprints (ECFP2)<break/>AtomPairs2DFingerprintCount (APC2D)</td>
<td align="left">SMILES graph attention network (SGAT),<break/>FCNN</td>
<td align="left">hERG channel inhibition<break/>- AUROC: 0.894<break/>- ACC: 0.817<break/>- MCC: 0.630<break/>- Sensitivity: 0.847</td>
<td align="left">
<xref ref-type="bibr" rid="B116">Wang Y. M. et al. (2023)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://github.com/zhaoqi106/DMFGAM">https://github.com/zhaoqi106/DMFGAM</ext-link>
</td>
</tr>
<tr>
<td align="left">CardioTox net</td>
<td align="left">2021</td>
<td align="left">BindingDB (<xref ref-type="bibr" rid="B73">Liu et al., 2007</xref>)<break/>ChEMBL (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>)<break/>
<xref ref-type="bibr" rid="B13">Cai et al. (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B24">Didziapetris and Lanevskij (2016)</xref>
<break/>
<xref ref-type="bibr" rid="B26">Doddareddy et al. (2010)</xref>
</td>
<td align="left">Molecular graph,<break/>Morgan fingerprints (ECFP2),<break/>2D&#x2b;3D Descriptors (Mordred),<break/>SMILES embedding vector,<break/>Fingerprint embedding vector</td>
<td align="left">meta-ensemble combining,<break/>GCN,<break/>FCNN and<break/>1D-CNN</td>
<td align="left">hERG channel inhibition <break/>[Test set-I]<break/>- ACC: 0.810<break/>- BAC: 0.810<break/>- MCC: 0.599<break/>Sensitivity: 0.833 <break/>[Test set-II]<break/>- ACC: 0.755<break/>- BAC: 0.754<break/>- MCC: 0.452<break/>- Sensitivity: 0.909 <break/>[Test set-III]<break/>- ACC: 0.746<break/>- BAC: 0.746<break/>- MCC: 0.220<break/>- Sensitivity: 0.794</td>
<td align="left">
<xref ref-type="bibr" rid="B51">Karim et al. (2021)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://github.com/Abdulk084/CardioTox">https://github.com/Abdulk084/CardioTox</ext-link>
</td>
</tr>
<tr>
<td align="left">DeepHIT</td>
<td align="left">2020</td>
<td align="left">BindingDB (<xref ref-type="bibr" rid="B73">Liu et al., 2007</xref>)<break/>ChEMBL (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>)<break/>
<xref ref-type="bibr" rid="B13">Cai et al. (2019)</xref>
<break/>
<xref ref-type="bibr" rid="B24">Didziapetris and Lanevskij (2016)</xref>
<break/>
<xref ref-type="bibr" rid="B26">Doddareddy et al. (2010)</xref>
<break/>In-house dataset</td>
<td align="left">Molecular Fingerprints (PyBioMed),<break/>Descriptors (Mordred),<break/>Molecular Graph</td>
<td align="left">GCN,<break/>FCNN</td>
<td align="left">hERG channel inhibition<break/>- ACC: 0.773<break/>- Sensitivity: 0.833<break/>- BAC: 0.738<break/>- MCC: 0.476</td>
<td align="left">
<xref ref-type="bibr" rid="B100">Ryu et al. (2020)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://academic.oup.com/bioinformatics/article/36/10/3049/5727757">https://academic.oup.com/bioinformatics/article/36/10/3049/5727757</ext-link>
</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s4-3">
<title>4.3 Renal/nephrotoxicity prediction</title>
<p>The kidneys are vital excretory organs that maintain homeostasis by producing urine, eliminating waste, and regulating water, electrolytes, and acid&#x2013;base balance. During renal clearance, pharmaceutical compounds undergo filtration, reabsorption, and secretion, contributing to their metabolism and excretion (<xref ref-type="bibr" rid="B39">Gong et al., 2022</xref>). However, this process also increases the kidneys&#x2019; exposure to potentially harmful substances, giving rise to drug-induced nephrotoxicity (DIN). The prevalence of DIN in the adult population has been reported to range from 14% to 26% (<xref ref-type="bibr" rid="B103">Shi et al., 2022</xref>). Drug-induced renal failure accounts for approximately 25% of acute kidney injury (AKI) cases in hospitalized patients, with aminoglycoside antibiotics, NSAIDs, contrast agents, and angiotensin-converting enzyme inhibitors (ACEi) among the most common causative drugs (<xref ref-type="bibr" rid="B37">Ghane Shahrbaf and Assadi, 2015</xref>; <xref ref-type="bibr" rid="B39">Gong et al., 2022</xref>). The underlying mechanisms of DIN are multifactorial, involving damage to tubular epithelial cells, ureteral obstruction, interstitial nephritis, and disruption of intra-glomerular hemodynamics (<xref ref-type="bibr" rid="B103">Shi et al., 2022</xref>).</p>
<p>Assessing DIN risk remains challenging due to the vast diversity of pharmaceutical agents with nephrotoxic potential. Many compounds, beyond the commonly recognized nephrotoxic drugs, can elicit kidney injury through distinct mechanisms and at varying sites within the renal architecture (<xref ref-type="bibr" rid="B103">Shi et al., 2022</xref>). These include selective damage to proximal or distal tubules, glomeruli, or the renal interstitium, depending on the drug&#x2019;s chemical properties, metabolites, and mechanisms of accumulation or transport within renal tissues. Given these complexities, traditional toxicological methods remain indispensable; however, they are often impractical for efficiently screening large number of compounds in the early stages of drug development. As a result, computational approaches that integrate diverse molecular features are increasingly recognized as valuable tools for the early identification of nephrotoxic risk (<xref ref-type="table" rid="T5">Table 5</xref>).</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Recent examples of nephrotoxicity prediction tools.</p>
</caption>
<table>
<thead valign="top">
<tr style="background-color:#D9D9D9">
<th align="left">Approach</th>
<th align="left">Year</th>
<th align="left">Dataset</th>
<th align="left">Features</th>
<th align="left">Algorithm</th>
<th align="left">Performance</th>
<th align="left">Ref.</th>
<th align="left">Availability</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Gong et al.</td>
<td align="left">2022</td>
<td align="left">SIDER (<xref ref-type="bibr" rid="B60">Kuhn et al., 2016</xref>), DrugBank (<xref ref-type="bibr" rid="B120">Wishart et al., 2018</xref>), ChEMBL (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>)<break/>TCM (<xref ref-type="bibr" rid="B16">Chen, 2011</xref>)</td>
<td align="left">Atom Pair 2D, fingerprint, Estate FP,<break/>CDK extended FP,<break/>CDK FP,<break/>CDK graph only FP, Klekota&#x2013;Roth FP,<break/>MACCS keys,<break/>PubChem FP, substructure FP</td>
<td align="left">FCNN, LGBM,<break/>SVM</td>
<td align="left">DIN prediction <break/>[Herbal Medicines (Test set-I)]<break/>- ANN_PubChemFP<break/>- AUROC: 0.911<break/>- ACC: 0.867<break/>- MCC: 0.740<break/>- SVM_GraphFP<break/>- AUROC:0.902<break/>- ACC: 0.867<break/>- MCC: 0.761 <break/>[Chemical Medicines (Test set-II)]<break/>- LGBM _KRFP<break/>- AUROC:0.896<break/>- ACC: 0.861<break/>- MCC: 0.721<break/>- SVM_GraphFP<break/>- AUROC:0.894<break/>- ACC: 0.814<break/>- MCC: 0.629<break/>[Mixed Medicines (Test set-III)]<break/>- SVM_GraphFP<break/>- AUROC:0.915<break/>- ACC: 0.857<break/>- MCC: 0.723<break/>- ANN_PubChemFP<break/>- AUROC:0.903<break/>- ACC: 0.857<break/>- MCC: 0.718</td>
<td align="left">
<xref ref-type="bibr" rid="B39">Gong et al. (2022)</xref>
</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Shi et al.</td>
<td align="left">2022</td>
<td align="left">SIDER (<xref ref-type="bibr" rid="B60">Kuhn et al., 2016</xref>), Pubchem (<xref ref-type="bibr" rid="B53">Kim et al., 2016</xref>)</td>
<td align="left">Chemaxon descriptors, Fragmentor,<break/>GSFrag descriptors, Mordred descriptors, PyDescriptor,<break/>QNPR descriptors,<break/>RDKit descriptors, alvaDesc descriptors</td>
<td align="left">Consensus model of random forest<break/>XGBoost<break/>CNN</td>
<td align="left">DIN prediction<break/>- AUROC: 0.93<break/>- MCC: 0.72<break/>- Accuracy (Q): 0.86<break/>- Sensitivity: 0.85<break/>- Specificity: 0.87<break/>- Enrichment Factor (EF): 1.72</td>
<td align="left">
<xref ref-type="bibr" rid="B103">Shi et al. (2022)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://www.sapredictor.cn/">http://www.sapredictor.cn/</ext-link>
</td>
</tr>
<tr>
<td align="left">Zhang et al.</td>
<td align="left">2019</td>
<td align="left">ChemIDplus</td>
<td align="left">Morgan fingerprints (ECFP6),<break/>Molecular descriptors</td>
<td align="left">Na&#xef;ve Bayes classifier,<break/>Genetic algorithm</td>
<td align="left">Chemical-induced urinary tract toxicity<break/>- ACC: 0.84</td>
<td align="left">
<xref ref-type="bibr" rid="B137">Zhang Y. M et al. (2019)</xref>
</td>
<td align="left"/>
</tr>
</tbody>
</table>
</table-wrap>
<p>The predictive model proposed by Gong et al. (<xref ref-type="bibr" rid="B39">Gong et al., 2022</xref>) was developed by utilizing the technique of fingerprinting chemical drugs and Chinese herbal medicines. This model aimed to provide a comprehensive prediction of nephrotoxicity. On the other hand, Shi et al. (<xref ref-type="bibr" rid="B103">Shi et al., 2022</xref>) developed a nephrotoxicity prediction model based on physicochemical property analysis. Among the approaches tested, the model utilizing QNPR descriptors with a random forest algorithm achieved the highest accuracy of 87.16%. Notably, the consensus model outperformed individual models, attaining a superior AUROC of 0.93. The model is accessible via a web interface and provides interpretability by identifying structural alerts associated with nephrotoxicity, using f-score and positive rate analysis of each fragment derived from KRFP fingerprints. Lastly, Zhang et al. (<xref ref-type="bibr" rid="B135">Zhang H. et al., 2019</xref>) categorized molecular features based on factors such as the number of nitrogen atoms, AlogP, molecular weight, hydrogen bond acceptors and donors, and fractional polar surface area. Among the evaluated algorithms, the Na&#xef;ve Bayes classifier demonstrated superior performance and was ultimately selected for nephrotoxicity prediction.</p>
</sec>
<sec id="s4-4">
<title>4.4 Neurotoxicity prediction</title>
<p>Neurotoxicity refers to the toxicity that affects both central and peripheral nervous systems leading to their impaired function and structure (<xref ref-type="bibr" rid="B65">Legradi et al., 2018</xref>). The mechanisms of neurotoxicity are broadly categorized into neuronopathy, axonopathy, myelinopathy, and neurotransmission-associated toxicity (<xref ref-type="bibr" rid="B109">Valentine, 2020</xref>; <xref ref-type="bibr" rid="B54">Kocot-Kepska et al., 2021</xref>). Even therapeutic drugs can exhibit neurotoxic effects; for instance, vincristine, a plant-derived chemotherapeutic alkaloid, is known to cause peripheral neuropathy, which manifests as numbness, tingling, and motor weakness. Given these risks, it is essential to screen for neurotoxicity during drug development to ensure the safety of new chemical entities. To this end, the OECD Test Guidelines 418, 419, and 424 are internationally recognized as standard protocols for assessing neurotoxic effects. However, these <italic>in vivo</italic> testing methods are time-consuming, costly, and reliant on animal use. Consequently, there is a growing demand for faster and more efficient <italic>in silico</italic> approaches to complement traditional testing methods in predicting neurotoxicity (<xref ref-type="bibr" rid="B49">Jiang et al., 2020</xref>).</p>
<p>In response to this need, several computational models have recently been developed to improve the prediction of neurotoxicity (<xref ref-type="table" rid="T6">Table 6</xref>). NeuTox 2.0 employs a hybrid deep learning framework that integrates molecular fingerprints, descriptors, and GNNs through multimodal feature fusion. It was trained on four neurotoxicity-related datasets and demonstrated strong generalizability and robustness, enabling its use in large-scale chemical screening. This design allows the model to predict various facets of neurotoxicity, offering a broader perspective on neurotoxic effects. However, since all input features are derived from the same molecular structure, the model&#x2019;s multimodal nature is limited in scope (<xref ref-type="bibr" rid="B88">Pang et al., 2025</xref>). DINeuroTpredictor is a web-based model built on clinical neurotoxicity data using multiple machine learning algorithms and molecular fingerprints. It also provides insights into key physicochemical features and structural alerts associated with neurotoxic potential (<xref ref-type="bibr" rid="B138">Zhao et al., 2022</xref>). Gadaleta et al. proposed a QSAR-based approach linked to AOPs, modeling molecular initiating events to support mechanistic neurotoxicity prediction (<xref ref-type="bibr" rid="B34">Gadaleta et al., 2022</xref>). Lastly, Jiang et al. developed regression models using PyBioMed descriptors and ensemble learning methods, focusing on chemical diversity and model applicability domains to enhance prediction reliability (<xref ref-type="bibr" rid="B49">Jiang et al., 2020</xref>).</p>
<table-wrap id="T6" position="float">
<label>TABLE 6</label>
<caption>
<p>Recent examples of neurotoxicity prediction tools.</p>
</caption>
<table>
<thead valign="top">
<tr style="background-color:#D9D9D9">
<th align="left">Approach</th>
<th align="left">Year</th>
<th align="left">Dataset</th>
<th align="left">Features</th>
<th align="left">Algorithm</th>
<th align="left">Performance</th>
<th align="left">Ref.</th>
<th align="left">Availability</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">NeuTox 2.0</td>
<td align="left">2025</td>
<td align="left">PubChem Bioassay database (<xref ref-type="bibr" rid="B53">Kim et al., 2016</xref>)<break/>ChEMBL database (<xref ref-type="bibr" rid="B35">Gaulton et al., 2017</xref>)<break/>U.S. EPA dataset (<xref ref-type="bibr" rid="B2">Albert, 1994</xref>)<break/>SIDER (<xref ref-type="bibr" rid="B60">Kuhn et al., 2016</xref>)<break/>
<xref ref-type="bibr" rid="B71">Liu et al. (2021)</xref>, <xref ref-type="bibr" rid="B79">Mazumdar et al. (2023)</xref>
<break/>
<xref ref-type="bibr" rid="B106">Tang et al. (2022)</xref>
<break/>
<xref ref-type="bibr" rid="B105">Storchi et al. (2023)</xref>
</td>
<td align="left">Molecular graph,<break/>Molecular fingerprint (ECFP),<break/>Molecular descriptor (Padel)</td>
<td align="left">DMPNN,<break/>MFBERT</td>
<td align="left">Blood&#x2013;Brain Barrier Penetration<break/>- AUROC: 0.9708<break/>- ACC: 0.9120<break/>- MCC: 0.8157<break/>- F1 Score: 0.9274<break/>Neuronal Cytotoxicity<break/>- AUROC: 0.9637<break/>- ACC: 0.9093<break/>- MCC: 0.8171<break/>- F1 Score: 0.8969<break/>Neural Activity Interference<break/>- AUROC: 0.8509<break/>- ACC: 0.8007<break/>- MCC: 0.5292<break/>- F1 Score: 0.6651<break/>Neurotoxicity<break/>- AUROC: 0.8297<break/>- ACC: 0.7945<break/>- MCC: 0.5140<break/>- F1 Score: 0.8539</td>
<td align="left">
<xref ref-type="bibr" rid="B88">Pang et al. (2025)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://github.com/xuejunhe/NeuTox-2.0">https://github.com/xuejunhe/NeuTox-2.0</ext-link>
</td>
</tr>
<tr>
<td align="left">DINeuro Tpredictor</td>
<td align="left">2022</td>
<td align="left">SIDER (<xref ref-type="bibr" rid="B60">Kuhn et al., 2016</xref>), PubChem (<xref ref-type="bibr" rid="B53">Kim et al., 2016</xref>)</td>
<td align="left">Estate FP, CDK FP, CDK ECFP,<break/>Klekota&#x2013;Roth FP,<break/>MACCS keys,<break/>PubChem FP, substructure FP</td>
<td align="left">Random Forest,<break/>SVM,<break/>C4.5 decision, tree, kNN,<break/>Na&#xef;ve Bayes</td>
<td align="left">Neurotoxicity<break/>5-fold CV<break/>- AUROC: 0.83<break/>- BAC: 0.7651<break/>- MCC: 0.52</td>
<td align="left">
<xref ref-type="bibr" rid="B138">Zhao et al. (2022)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://dineurot.sapredictor.cn/">http://dineurot.sapredictor.cn/</ext-link>
</td>
</tr>
<tr>
<td align="left">
<xref ref-type="bibr" rid="B34">Gadaleta et al. (2022)</xref>
</td>
<td align="left">2022</td>
<td align="left">ChEMBL (<xref ref-type="bibr" rid="B53">Kim et al., 2016</xref>), Literature (<xref ref-type="bibr" rid="B56">Kosnik et al., 2020</xref>)</td>
<td align="left">MIE predictions, Dragon descriptors,<break/>ECFP</td>
<td align="left">Random forest, kNN,<break/>MLP-NNET</td>
<td align="left">Neurotoxicity<break/>- AUROC: 0.91<break/>- MCC: 0.66</td>
<td align="left">
<xref ref-type="bibr" rid="B34">Gadaleta et al. (2022)</xref>
</td>
<td align="left"/>
</tr>
<tr>
<td align="left">
<xref ref-type="bibr" rid="B49">Jiang et al. (2020)</xref>
</td>
<td align="left">2020</td>
<td align="left">ChemIDplus</td>
<td align="left">MATSp2, bcutv10, MRVSA5, GATSe2, Rpc, EstateVSA1, Geto, Smax15, MTPSA, bcute2, J, Chiv10, Chiv9, mChi1, Smin8, Hy, Smin32, MATSv3, MATSe3, MACCS keys</td>
<td align="left">Extra-trees regressor</td>
<td align="left">Autonomic Neurotoxicity (pLD<sub>50</sub>)<break/>- q<sup>2</sup>: 0.784<break/>- RMSE: 0.201<break/>- MAE: 0.159</td>
<td align="left">
<xref ref-type="bibr" rid="B49">Jiang et al. (2020)</xref>
</td>
<td align="left"/>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s4-5">
<title>4.5 Genotoxicity/carcinogenicity</title>
<p>Genotoxicity is defined as the capacity of deleterious agents to induce harm to the genetic material within cells (<xref ref-type="bibr" rid="B96">Ren et al., 2017</xref>). Mutagenicity pertains to the capacity of a substance to induce alterations in genetic material, which could potentially instigate diverse ailments, such as cancer (<xref ref-type="bibr" rid="B30">Ferguson, 2010</xref>; <xref ref-type="bibr" rid="B9">Basu, 2018</xref>). Carcinogenicity is the potential of a compound to cause cancer (<xref ref-type="bibr" rid="B101">Schrenk, 2018</xref>). These three concepts, i.e., genotoxicity, mutagenicity, and carcinogenicity, exhibit a strong correlation due to the fact that substances that possess genotoxic properties frequently result in mutations, and these mutations can induce the development of cancer (<xref ref-type="bibr" rid="B8">Barnes et al., 2018</xref>; <xref ref-type="bibr" rid="B85">Nohmi, 2018</xref>). Given the fact that cancer is one of the most prominent reasons contributing to mortality on a global scale, it becomes imperative to thoroughly scrutinize the plausible factors that give rise to this ailment. Unlike other forms of toxicity, carcinogenicity is distinct in that it does not exhibit a threshold in the assessment of dose-response. This phenomenon arises from the fact that a lone anomaly through interactions with DNA, instigated by a specific compound, can yield a protracted consequence and engender the formation of neoplastic growth (<xref ref-type="bibr" rid="B85">Nohmi, 2018</xref>). Numerous principles are established in light of this, particularly the guidelines of S1B(R1) (<xref ref-type="bibr" rid="B47">ICH, 2022</xref>), S2 (R1) (<xref ref-type="bibr" rid="B46">ICH, 2020</xref>), and M7 (R1) (<xref ref-type="bibr" rid="B48">ICH, 2023</xref>) outlined by the ICH. The course of action typically takes 2&#xa0;years and involves around 500 rodents, making it a rigorous, time-consuming, and resource-intensive task (<xref ref-type="bibr" rid="B68">Li T. et al., 2021</xref>). Furthermore, the test&#x2019;s complexity depends on whether it is analyzing the genetic, DNA, or chromosomal level, and whether it is intended for somatic or germline cells (<xref ref-type="bibr" rid="B96">Ren et al., 2017</xref>). Due to these obstacles, there is a growing demand for AI-assisted prediction to overcome these challenges.</p>
<p>Currently available AI prediction tools of mutagenicity and genotoxicity are summarized in <xref ref-type="table" rid="T7">Table 7</xref> muTOX-AL proposed a deep active learning framework to address the challenge of limited labeled data in mutagenicity prediction. By actively selecting the most informative molecules from a vast chemical space and presenting them for annotation, the model significantly reduces the number of training samples required. It also demonstrates strong discriminative power by identifying structurally similar molecules with opposing mutagenic properties (<xref ref-type="bibr" rid="B125">Xu et al., 2024</xref>). Fournier et al. introduced a model capable of predicting genotoxicity across various assays, including Ames test results, chromosomal aberrations, and gene mutations, thereby expanding the scope of genotoxicity evaluation. Despite its broad predictive scope, the model introduced by Fournier et al. does not provide executable tools or source code, limiting its immediate applicability and reproducibility (<xref ref-type="bibr" rid="B32">Fournier et al., 2023</xref>). DCAMCP employed a self-attention routing capsule network to improve generalizability while reducing the number of trainable parameters, demonstrating balanced performance across multiple evaluation metrics (<xref ref-type="bibr" rid="B22">Chen et al., 2023</xref>). Shinada et al. constructed a model using descriptors derived from density functional theory (DFT). Although its performance was modest, the study highlighted opportunities to improve computational approaches (<xref ref-type="bibr" rid="B104">Shinada et al., 2022</xref>). Mart&#xed;nez et al. developed the first predictive model based on Ames test standards (OECD TA98, TA100, TA1535, TA1537, and TA102), setting a precedent for mutagenicity prediction using standardized experimental protocols. The multi-task learning framework with shared parameters enabled information transfer across tasks, improving mutagenicity prediction for each strain (<xref ref-type="bibr" rid="B77">Mart&#xed;nez et al., 2022</xref>).</p>
<table-wrap id="T7" position="float">
<label>TABLE 7</label>
<caption>
<p>Recent examples of Genotoxicity/carcinogenicity prediction tools.</p>
</caption>
<table>
<thead valign="top">
<tr style="background-color:#D9D9D9">
<th align="left">Approach</th>
<th align="left">Year</th>
<th align="left">Dataset</th>
<th align="left">Features</th>
<th align="left">Algorithm</th>
<th align="left">Performance</th>
<th align="left">Ref.</th>
<th align="left">Availability</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">muTOX-AL</td>
<td align="left">2024</td>
<td align="left">TOXRIC (<xref ref-type="bibr" rid="B123">Wu Z. X. et al., 2023</xref>)<break/>Li&#x2019;s dataset (<xref ref-type="bibr" rid="B67">Li S. M. et al., 2021</xref>)</td>
<td align="left">Molecular fingerprints (ECFP2, ECFP4, ECFP6)<break/>MACCS keys<break/>Molecular descriptors (RDkit2D)</td>
<td align="left">2D-CNN<break/>Active learning</td>
<td align="left">Mutagenicity (Ames test)<break/>Full training (5,988 samples)<break/>- AUROC: 0.9093<break/>- ACC: 0.8476<break/>- F1 Score: 0.8383<break/>- Recall: 0.8350<break/>Active learning (1,438 samples)<break/>&#x2212; 95% of the full-model accuracy using 1,438 samples (&#x223c;24% of the training data)</td>
<td align="left">
<xref ref-type="bibr" rid="B125">Xu et al. (2024)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://github.com/Felicityxuhy/muTOX-AL">https://github.com/Felicityxuhy/muTOX-AL</ext-link>
</td>
</tr>
<tr>
<td align="left">
<xref ref-type="bibr" rid="B32">Fournier et al. (2023)</xref>
</td>
<td align="left">2023</td>
<td align="left">
<xref ref-type="bibr" rid="B124">Xu et al. (2012)</xref>
<break/>
<xref ref-type="bibr" rid="B42">Hansen et al. (2009)</xref>
<break/>
<xref ref-type="bibr" rid="B10">Benigni et al. (2013)</xref>
<break/>
<xref ref-type="bibr" rid="B25">Dimitrov et al. (2016)</xref>
</td>
<td align="left">2D descriptors<break/>MACCS keys</td>
<td align="left">Recursive molecular similarity, Extremely randomized trees</td>
<td align="left">Mutagenicity (Ames test)<break/>- AUROC: 0.9208 chromosomal abnormalities<break/>- AUROC: 0.9191 mammalian cell gene mutation test<break/>- AUROC: 0.9722</td>
<td align="left">
<xref ref-type="bibr" rid="B32">Fournier et al. (2023)</xref>
</td>
<td align="left"/>
</tr>
<tr>
<td align="left">DCAMCP</td>
<td align="left">2023</td>
<td align="left">CPDB (<xref ref-type="bibr" rid="B38">Gold et al., 2005</xref>), CCRIS database, ISSCAN (<xref ref-type="bibr" rid="B11">Benigni et al., 2008</xref>)</td>
<td align="left">Various molecular fingerprints<break/>MACCS keys<break/>PubChem FP<break/>CDK FP<break/>CDK extended FP<break/>Klekota-Roth FP<break/>AP2D<break/>Klekota-Roth count<break/>AP2DC<break/>Substructure (FP4)<break/>Substructure count (FP4C)<break/>Estate FP</td>
<td align="left">A capsule network with a self-attention routing algorithm</td>
<td align="left">Carcinogenicity<break/>- AUROC: 0.793<break/>- ACC: 0.718<break/>- Sensitivity: 0.721<break/>- Specificity: 0.715</td>
<td align="left">
<xref ref-type="bibr" rid="B22">Chen et al. (2023)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://github.com/zhaoqi106/DCAMCP">https://github.com/zhaoqi106/DCAMCP</ext-link>
</td>
</tr>
<tr>
<td align="left">
<xref ref-type="bibr" rid="B104">Shinada et al. (2022)</xref>
</td>
<td align="left">2022</td>
<td align="left">
<xref ref-type="bibr" rid="B42">Hansen et al. (2009)</xref>
</td>
<td align="left">MACCS, ECFP, Mol2vec, Computed molecular descriptors, structural alerts relevant to mutagenicity, DFT-based descriptors</td>
<td align="left">SVM</td>
<td align="left">Mutagenicity (Ames test)<break/>AUROC: 0.926</td>
<td align="left">
<xref ref-type="bibr" rid="B104">Shinada et al. (2022)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://bitbucket.org/sbx-publication/enhanced_representation_mutagenicity/src/master/">https://bitbucket.org/sbx-publication/enhanced_representation_mutagenicity/src/master/</ext-link>
</td>
</tr>
<tr>
<td align="left">
<xref ref-type="bibr" rid="B77">Mart&#xed;nez et al. (2022)</xref>
</td>
<td align="left">2022</td>
<td align="left">ISSSTY v1-a database (<xref ref-type="bibr" rid="B10">Benigni et al., 2013</xref>)</td>
<td align="left">0D, 1D, and 2D molecular descriptors</td>
<td align="left">Multitask-FCNN<break/>Consensus model (averaging)</td>
<td align="left">Mutagenicity (Ames test)<break/>Balanced ACC: 0.93<break/>MCC: 0.89<break/>H1 Score: 0.92<break/>Specificity: 0.86<break/>Sensitivity: 0.99</td>
<td align="left">
<xref ref-type="bibr" rid="B77">Mart&#xed;nez et al. (2022)</xref>
</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://github.com/VirSabando/MTL_DNN_Ames">https://github.com/VirSabando/MTL_DNN_Ames</ext-link>
</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s5">
<title>5 Emerging AI innovations in toxicity prediction</title>
<p>As previously discussed, AI model design is significantly affected by both the characteristics and the volume of data available for training. In the context of toxicity prediction for drug discovery, input data typically comprises molecular structures, physicochemical properties, and task-specific features. However, these tasks are often constrained by the limited availability of labeled data. To address this challenge, a variety of data-efficient learning strategies have been developed to maximize predictive performance under label-scarce conditions.</p>
<p>In data-scarce settings, transfer learning strategies use pre-trained parameters to boost toxicity prediction performance. For instance, HelixADMET employs a three-stage training framework that incorporates self-supervised pretraining on large-scale unlabeled molecular data, followed by multi-task and fine-tuning stages to transfer learned chemical knowledge to various ADMET endpoints, significantly improving extrapolation to novel chemical scaffolds (<xref ref-type="bibr" rid="B136">Zhang et al., 2022</xref>). Multimodal models ingest diverse data types (e.g., chemical structures, omics profiles, and bioactivity assays) simultaneously to capture complementary information. For example, M2REMAP is a multimodal deep learning framework that predicts drug indications, mono-drug side effects, and drug&#x2013;drug interaction side effects by integrating molecular chemical structures with clinical semantic embeddings derived from large-scale electronic health records (EHR). By learning joint representations across these heterogeneous modalities, M2REMAP achieves superior predictive accuracy and generalizability over unimodal baselines (<xref ref-type="bibr" rid="B118">Wen et al., 2023</xref>). Mart&#xed;nez et al. developed multi-task deep neural networks to simultaneously predict Ames mutagenicity across multiple Salmonella typhimurium strains (<xref ref-type="bibr" rid="B77">Mart&#xed;nez et al., 2022</xref>). They demonstrated that shared representations improved performance, especially on the strains with limited training data. Active learning enhances data efficiency by strategically selecting the most informative samples, enabling high model performance even with limited labeled data. For example, the muTOX-AL framework integrates structure-based and activity-based selection strategies to guide experimental toxicology, significantly improving model performance with fewer labeled compounds compared to random sampling (<xref ref-type="bibr" rid="B125">Xu et al., 2024</xref>). Federated learning enables multiple institutions to collaboratively train a global toxicity prediction model on decentralized datasets in which each party keeps its raw data locally and only shares model updates, thus preserving data privacy and regulatory compliance while benefiting from a much larger, heterogeneous training pool. The MELLODDY project exemplifies this approach, demonstrating that federated QSAR models trained across ten pharmaceutical companies achieved comparable or superior predictive performance to local models, while maintaining strict data confidentiality (<xref ref-type="bibr" rid="B44">Heyndrickx et al., 2023</xref>).</p>
<p>In parallel, interpretability techniques are also advancing to better inform and guide decision-making in drug discovery based on model predictions. SHAP estimates the contribution of each input feature to the output, providing insight into which molecular properties influence model decisions (<xref ref-type="bibr" rid="B75">Lundberg and Lee, 2017</xref>). For graph-based models, methods like EdgeSHAPer extend this concept by identifying important substructures within molecular graphs (<xref ref-type="bibr" rid="B78">Mastropietro et al., 2022</xref>). Attention-based visualizations, commonly used in transformer and graph neural network models, highlight which parts of the input the model focuses on during prediction (<xref ref-type="bibr" rid="B133">Ying et al., 2019</xref>; <xref ref-type="bibr" rid="B139">Zheng et al., 2019</xref>). For example, in SMILES-based models, attention heatmaps can reveal which atoms or functional groups are most influential in predicting toxicity. Counterfactual explanations, on the other hand, offer intuitive and sparse insights by showing the smallest alteration to input features that would change a model&#x2019;s prediction, particularly useful for understanding how minimal molecular changes affect outcomes. In drug design, small structural modifications can often result in counterfactual cases with significant impact on activity or toxicity, leading to growing interest in counterfactual explanation methods to better capture such subtle yet meaningful variations (<xref ref-type="bibr" rid="B117">Wellawatte et al., 2022</xref>).</p>
<p>Building on these recent advances, the next phase of toxicity prediction may be driven by foundation models and large-scale language-based systems. Looking ahead, emerging foundation models such as MoleculeGPT (<xref ref-type="bibr" rid="B74">Liu et al., 2024</xref>), BioT5 (<xref ref-type="bibr" rid="B90">Pei et al., 2023</xref>), and ChemCrow (<xref ref-type="bibr" rid="B12">Bran et al., 2024</xref>) could be applied to toxicity prediction. Even before the advent of large language models (LLMs), Papamokos and Silins demonstrated that integrating QSAR modeling with text mining improved the mechanistic understanding of carcinogenicity and helped compensate for limited structure&#x2013;activity data on non-genotoxic compounds (<xref ref-type="bibr" rid="B89">Papamokos and Silins, 2016</xref>). By linking chemical structures with literature-derived modes of action, their hybrid approach offered more biologically meaningful interpretations to support mechanism-based toxicity evaluation. Today, with the advent of powerful LLMs, such strategies can be further scaled and generalized. Fine-tuning these large, pre-trained models enables researchers to integrate broad and transferable chemical and biological knowledge into downstream toxicity prediction tasks, while producing mechanistically interpretable results even in data-scarce domains. These AI-driven methods not only improve predictive accuracy in data-scarce scenarios but are also continuing to advance rapidly, expanding the possibilities for mechanism-informed toxicology.</p>
</sec>
<sec id="s6">
<title>6 AI in regulatory toxicology</title>
<p>The use of AI-based models in regulatory toxicology is drawing growing interest, especially as agencies seek alternatives to animal testing. Yet, adoption remains limited due to the absence of clear validation standards and acceptance criteria. ICH guidelines, including M7 (R2), S2 (R1), and S1B(R1), provide frameworks for using <italic>in silico</italic> approaches such as AI-based models and advanced QSAR tools (ICH, 2022; 2023). These can support mutagenic impurity screening, genotoxicity testing, and carcinogenicity assessment, provided they are properly justified and validated. In this context, the FDA NCTR&#x2019;s AI4TOX program is specifically aimed at applying AI to toxicology to develop new tools that support FDA regulatory science and strengthen the safety review of FDA-regulated products (<xref ref-type="bibr" rid="B4">An FDA Artificial Intelligence, 2024</xref>). It focuses on leveraging AI for tasks like developing virtual animal models, evaluating toxicological endpoints, and analyzing complex data from FDA documents and histopathology. For broader adoption, AI models must align with regulatory expectations, demonstrate consistent performance, and offer interpretability.</p>
<p>As the use of AI in regulatory toxicology continues to expand, it becomes increasingly important to consider how existing validation principles can be adapted or extended to ensure these models meet regulatory standards. To enhance the reliability and regulatory acceptance of AI-based toxicity prediction models, it is useful to apply the OECD QSAR validation principles (<xref ref-type="bibr" rid="B87">OECD, 2014</xref>). Originally developed for traditional QSAR models, these principles outline key elements such as defined endpoints, transparent algorithms, applicability domains, performance metrics, and mechanistic interpretation when possible. While these criteria remain broadly relevant, the guidance was established before the advent of modern AI techniques. Given the rapid development of AI and its increasing integration into the drug discovery process, there is a growing need for updated validation frameworks that explicitly address the unique challenges and opportunities presented by AI-based modeling approaches.</p>
</sec>
<sec id="s7">
<title>7 Limitations, challenges, and future directions</title>
<p>The efficacy and safety of chemical compounds are fundamental considerations in drug discovery, with toxicity representing a key determinant of clinical success or failure. AI-based prediction models have emerged as powerful tools for toxicity assessment during the early stages of drug discovery. As databases continue to grow, computational resources become more accessible, and AI architectures evolve, these models have significantly advanced beyond traditional computational methods and enable reliable predictions across various toxicological endpoints, including hepatotoxicity, cardiotoxicity, nephrotoxicity, neurotoxicity, and genotoxicity. This review has systematically examined both general-purpose ADMET prediction tools and endpoint-specific toxicity models, highlighting rapid progress, increasing methodological sophistication, and expanding diversity within the field of computational toxicology. Nevertheless, several critical challenges persist. First of all, despite significant advances, current AI models frequently struggle with accurately predicting complex and rare toxicity events due to intrinsic biological complexities. The scarcity of high-quality labeled data, particularly data that accurately reflects clinical outcomes or rare toxicological events, severely constrains model training and validation. Also, generalizability to novel chemical scaffolds remains uncertain, limiting confidence in AI predictions for structurally diverse or innovative drug candidates. Finally, interpretability also remains a crucial bottleneck; although advanced AI models offer powerful predictive capabilities, their complex inner workings often limit the clarity and transparency required by regulatory bodies and clinical practitioners.</p>
<p>To overcome these limitations, future research can be focused on the integration of diverse data types, including detailed chemical structures, comprehensive biological assay outcomes, multi-omics profiles, and real-world clinical datasets. Such integration will enable AI models to capture the multifaceted nature of toxicological responses in a better way. Harmonizing toxicity annotations across multiple databases will also significantly enhance data interoperability, enabling more extensive and efficient utilization of available data resources. In parallel, fostering deeper cross-disciplinary collaboration among computational scientists, toxicologists, medicinal chemists, clinical pharmacologists, and regulatory experts is essential. Such collaborations can facilitate the development of predictive models that are not only robust and accurate but also practically interpretable, ensuring that model insights can directly inform discovery and regulatory decisions.</p>
<p>As AI technologies continue to evolve, it would be definite that they hold significant potential for enhancing early-stage decision-making, substantially reducing late-stage drug development failures, and accelerating the delivery of safer, more effective therapeutic solutions to patients. To fully employ this potential, it is crucial to foster a deeper understanding of the real-world implications and limitations of predictive outcomes. Practical integration requires not just technological advances but also a comprehensive awareness of pharmaceutical, clinical realities and regulatory standards. Thus, ongoing dialogue and knowledge-sharing between computational developers, experimental toxicologists, clinical researchers, and regulatory stakeholders will be indispensable in shaping the next-generation of AI-driven predictive toxicology tools that meaningfully improve drug discovery outcomes in both academic research and industry practice.</p>
</sec>
</body>
<back>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>HL: Investigation, Writing &#x2013; original draft. JK: Investigation, Visualization, Writing &#x2013; original draft. J-WK: Conceptualization, Project administration, Writing &#x2013; review and editing. YL: Conceptualization, Project administration, Resources, Supervision, Writing &#x2013; review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s9">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This research was supported by the Korean Ministry of Environment under the Environmental Health R&#x26;D Program (No. 2021003310005) and the Chung-Ang University Research Grants in 2023.</p>
</sec>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s11">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s12">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ai</surname>
<given-names>H. X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>L. C.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>Z. M.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Predicting drug-induced liver injury using ensemble learning methods and molecular fingerprints</article-title>. <source>Toxicol. Sci.</source> <volume>165</volume> (<issue>1</issue>), <fpage>100</fpage>&#x2013;<lpage>107</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kfy121</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Albert</surname>
<given-names>R. E.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Carcinogen risk assessment in the us environmental-protection-agency</article-title>. <source>Crit. Rev. Toxicol.</source> <volume>24</volume> (<issue>1</issue>), <fpage>75</fpage>&#x2013;<lpage>85</lpage>. <pub-id pub-id-type="doi">10.3109/10408449409017920</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alves</surname>
<given-names>V. M.</given-names>
</name>
<name>
<surname>Muratov</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Fourches</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Strickland</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kleinstreuer</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Andrade</surname>
<given-names>C. H.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Predicting chemically-induced skin reactions. Part I: QSAR models of skin sensitization and their application to identify potentially hazardous compounds</article-title>. <source>Toxicol. Appl. Pharmacol.</source> <volume>284</volume> (<issue>2</issue>), <fpage>262</fpage>&#x2013;<lpage>272</lpage>. <pub-id pub-id-type="doi">10.1016/j.taap.2014.12.014</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="web">
<collab>An FDA Artificial Intelligence (AI)</collab> (<year>2024</year>). <article-title>Program for toxicology</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.fda.gov/about-fda/nctr-research-focus-areas/artificial-intelligence">https://www.fda.gov/about-fda/nctr-research-focus-areas/artificial-intelligence</ext-link> (Accessed June 13, 2025)</comment>.</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ankley</surname>
<given-names>G. T.</given-names>
</name>
<name>
<surname>Bennett</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Erickson</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Hoff</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Hornung</surname>
<given-names>M. W.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>R. D.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>Adverse outcome pathways: a conceptual framework to support ecotoxicology research and risk assessment</article-title>. <source>Environ. Toxicol. Chem.</source> <volume>29</volume> (<issue>3</issue>), <fpage>730</fpage>&#x2013;<lpage>741</lpage>. <pub-id pub-id-type="doi">10.1002/etc.34</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Babai</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Auclert</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Le-Louet</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Safety data and withdrawal of hepatotoxic drugs</article-title>. <source>Therapie</source> <volume>76</volume> (<issue>6</issue>), <fpage>715</fpage>&#x2013;<lpage>723</lpage>. <pub-id pub-id-type="doi">10.1016/j.therap.2018.02.004</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Banerjee</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kemmler</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Dunkel</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Preissner</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>ProTox 3.0: a webserver for the prediction of toxicity of chemicals</article-title>. <source>Nucleic Acids Res.</source> <volume>52</volume> (<issue>W1</issue>), <fpage>W513</fpage>&#x2013;<lpage>W520</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkae303</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Barnes</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Zubair</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>John</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Poirier</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Martin</surname>
<given-names>F. L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Carcinogens and DNA damage</article-title>. <source>Biochem. Soc. Trans.</source> <volume>46</volume> (<issue>5</issue>), <fpage>1213</fpage>&#x2013;<lpage>1224</lpage>. <pub-id pub-id-type="doi">10.1042/Bst20180519</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Basu</surname>
<given-names>A. K.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>DNA damage, mutagenesis and cancer</article-title>. <source>Int. J. Mol. Sci.</source> <volume>19</volume> (<issue>4</issue>), <fpage>970</fpage>. <pub-id pub-id-type="doi">10.3390/ijms19040970</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Benigni</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Battistelli</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Bossa</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Tcheremenskaia</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Crettaz</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>New perspectives in toxicological information management, and the role of ISSTOX databases in assessing chemical mutagenicity and carcinogenicity</article-title>. <source>Mutagenesis</source> <volume>28</volume> (<issue>4</issue>), <fpage>401</fpage>&#x2013;<lpage>409</lpage>. <pub-id pub-id-type="doi">10.1093/mutage/get016</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Benigni</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bossa</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Richard</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>C. H.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>A novel approach: chemical relational databases, and the role of the ISSCAN database on assessing chemical carcinogenicity</article-title>. <source>Ann. Dell Ist. Super. Di Sanita</source> <volume>44</volume> (<issue>1</issue>), <fpage>48</fpage>&#x2013;<lpage>56</lpage>.</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bran</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Cox</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Schilter</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Baldassari</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>White</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Schwaller</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Augmenting large language models with chemistry tools</article-title>. <source>Nat. Mach. Intell.</source> <volume>6</volume> (<issue>5</issue>), <fpage>525</fpage>&#x2013;<lpage>535</lpage>. <pub-id pub-id-type="doi">10.1038/s42256-024-00832-8</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cai</surname>
<given-names>C. P.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>P. F.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y. D.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>J. W.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>F. X.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Deep learning-based prediction of drug-induced cardiotoxicity</article-title>. <source>J. Chem. Inf. Model.</source> <volume>59</volume> (<issue>3</issue>), <fpage>1073</fpage>&#x2013;<lpage>1084</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.8b00769</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cavasotto</surname>
<given-names>C. N.</given-names>
</name>
<name>
<surname>Scardino</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Machine learning toxicity prediction: latest advances by toxicity end point</article-title>. <source>Acs Omega</source> <volume>7</volume> (<issue>51</issue>), <fpage>47536</fpage>&#x2013;<lpage>47546</lpage>. <pub-id pub-id-type="doi">10.1021/acsomega.2c05693</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Celik</surname>
<given-names>F. K.</given-names>
</name>
<name>
<surname>Karaduman</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Machine learning-based prediction of drug-induced hepatotoxicity: an OvA-QSTR approach</article-title>. <source>J. Chem. Inf. Model.</source> <volume>63</volume> (<issue>15</issue>), <fpage>4602</fpage>&#x2013;<lpage>4614</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.3c00687</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>C. Y. C.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>TCM Database@Taiwan: the world&#x27;s largest traditional Chinese medicine database for drug screening <italic>in silico</italic>
</article-title>. <source>Plos One</source> <volume>6</volume> (<issue>1</issue>), <fpage>e15939</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0015939</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Borlak</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W. D.</given-names>
</name>
</person-group> (<year>2013a</year>). <article-title>High lipophilicity and high daily dose of oral medications are associated with significant risk for drug-induced liver injury</article-title>. <source>Hepatology</source> <volume>58</volume> (<issue>1</issue>), <fpage>388</fpage>&#x2013;<lpage>396</lpage>. <pub-id pub-id-type="doi">10.1002/hep.26208</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H. X.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Kelly</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>G. X.</given-names>
</name>
<name>
<surname>Borlak</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2013b</year>). <article-title>Quantitative structure-activity relationship models for predicting drug-induced liver injury based on FDA-approved drug labeling annotation and using a large collection of drugs</article-title>. <source>Toxicol. Sci.</source> <volume>136</volume> (<issue>1</issue>), <fpage>242</fpage>&#x2013;<lpage>249</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kft189</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Suzuki</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Thakkar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W. D.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>DILIrank: the largest reference drug list ranked by the risk for developing drug-induced liver injury in humans</article-title>. <source>Drug Discov. Today</source> <volume>21</volume> (<issue>4</issue>), <fpage>648</fpage>&#x2013;<lpage>653</lpage>. <pub-id pub-id-type="doi">10.1016/j.drudis.2016.02.015</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Vijay</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z. C.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W. D.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>FDA-approved drug labeling for the study of drug-induced liver injury</article-title>. <source>Drug Discov. Today</source> <volume>16</volume> (<issue>15-16</issue>), <fpage>697</fpage>&#x2013;<lpage>703</lpage>. <pub-id pub-id-type="doi">10.1016/j.drudis.2011.05.007</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X. Y.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Qiu</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>ResNet18DNN: prediction approach of drug-induced liver injury by deep neural network with ResNet18</article-title>. <source>Briefings Bioinforma.</source> <volume>23</volume> (<issue>1</issue>), <fpage>bbab503</fpage>. <pub-id pub-id-type="doi">10.1093/bib/bbab503</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>J. Q.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>S. D.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>DCAMCP: a deep learning model based on capsule network and attention mechanism for molecular carcinogenicity prediction</article-title>. <source>J. Cell. Mol. Med.</source> <volume>27</volume> (<issue>20</issue>), <fpage>3117</fpage>&#x2013;<lpage>3126</lpage>. <pub-id pub-id-type="doi">10.1111/jcmm.17889</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Didziapetris</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lanevskij</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Compilation and physicochemical classification analysis of a diverse hERG inhibition database</article-title>. <source>J. Computer-Aided Mol. Des.</source> <volume>30</volume> (<issue>12</issue>), <fpage>1175</fpage>&#x2013;<lpage>1188</lpage>. <pub-id pub-id-type="doi">10.1007/s10822-016-9986-0</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dimitrov</surname>
<given-names>S. D.</given-names>
</name>
<name>
<surname>Diderich</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Sobanski</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Pavlov</surname>
<given-names>T. S.</given-names>
</name>
<name>
<surname>Chankov</surname>
<given-names>G. V.</given-names>
</name>
<name>
<surname>Chapkanov</surname>
<given-names>A. S.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>QSAR Toolbox - workflow and major functionalities</article-title>. <source>Sar Qsar Environ. Res.</source> <volume>27</volume> (<issue>3</issue>), <fpage>203</fpage>&#x2013;<lpage>219</lpage>. <pub-id pub-id-type="doi">10.1080/1062936x.2015.1136680</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Doddareddy</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Klaasse</surname>
<given-names>E. C.</given-names>
</name>
<name>
<surname>Ijzerman</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Bender</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Prospective validation of a comprehensive <italic>in silico</italic> hERG model and its applications to commercial compound and drug databases</article-title>. <source>Chemmedchem</source> <volume>5</volume> (<issue>5</issue>), <fpage>716</fpage>&#x2013;<lpage>729</lpage>. <pub-id pub-id-type="doi">10.1002/cmdc.201000024</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Du</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>H. B.</given-names>
</name>
<name>
<surname>Zou</surname>
<given-names>B. Y.</given-names>
</name>
<name>
<surname>Babcock</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Long</surname>
<given-names>S. Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>hERGCentral: a large database to store, retrieve, and analyze compound-human <italic>ether-&#xe0;-go-go</italic> related gene channel interactions to facilitate cardiotoxicity assessment in drug development</article-title>. <source>Assay Drug Dev. Technol.</source> <volume>9</volume> (<issue>6</issue>), <fpage>580</fpage>&#x2013;<lpage>588</lpage>. <pub-id pub-id-type="doi">10.1089/adt.2011.0425</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Duffus</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Glossary for chemists of terms used in toxicology (IUPAC Recommendations 1993)</article-title>. <source>Pure Appl. Chem.</source> <volume>65</volume> (<issue>9</issue>), <fpage>2003</fpage>&#x2013;<lpage>2122</lpage>. <pub-id pub-id-type="doi">10.1351/pac199365092003</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<collab>FDA</collab> (<year>2005</year>). <article-title>International conference on harmonisation; guidance on S7B nonclinical evaluation of the potential for delayed ventricular repolarization (QT interval prolongation) by human pharmaceuticals; availability. Notice</article-title>. <source>Fed. Regist.</source> <volume>70</volume>, <fpage>61133</fpage>&#x2013;<lpage>61134</lpage>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/pubmed/16237859">https://www.ncbi.nlm.nih.gov/pubmed/16237859</ext-link>.</comment>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ferguson</surname>
<given-names>L. R.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Chronic inflammation and mutagenesis</article-title>. <source>Mutat. Research/Fundamental Mol. Mech. Mutagen.</source> <volume>690</volume> (<issue>1-2</issue>), <fpage>3</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1016/j.mrfmmm.2010.03.007</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Foulds</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Trevino</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>York</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Walker</surname>
<given-names>C. L.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Endocrine-disrupting chemicals and fatty liver disease</article-title>. <source>Nat. Rev. Endocrinol.</source> <volume>13</volume> (<issue>8</issue>), <fpage>445</fpage>&#x2013;<lpage>457</lpage>. <pub-id pub-id-type="doi">10.1038/nrendo.2017.42</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fournier</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Vroland</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Megy</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Aguero</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chemelle</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Defoort</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>
<italic>In silico</italic> genotoxicity prediction by similarity search and machine learning algorithm: optimization and validation of the method for high energetic materials</article-title>. <source>Propellants Explos. Pyrotech.</source> <volume>48</volume> (<issue>4</issue>), <fpage>e202200259</fpage>. <pub-id pub-id-type="doi">10.1002/prep.202200259</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>N. N.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>Y. H.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Z. X.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>ADMETlab 3.0: an updated comprehensive online ADMET prediction platform enhanced with broader coverage, improved performance, API functionality and decision support</article-title>. <source>Nucleic Acids Res.</source> <volume>52</volume> (<issue>W1</issue>), <fpage>W422</fpage>&#x2013;<lpage>W431</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkae236</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gadaleta</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Sp&#xee;nu</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Roncaglioni</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cronin</surname>
<given-names>M. T. D.</given-names>
</name>
<name>
<surname>Benfenati</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Prediction of the neurotoxic potential of chemicals based on modelling of molecular initiating events upstream of the adverse outcome pathways of (developmental) neurotoxicity</article-title>. <source>Int. J. Mol. Sci.</source> <volume>23</volume> (<issue>6</issue>), <fpage>3053</fpage>. <pub-id pub-id-type="doi">10.3390/ijms23063053</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gaulton</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hersey</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nowotka</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bento</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Chambers</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mendez</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>The ChEMBL database in 2017</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume> (<issue>D1</issue>), <fpage>D945</fpage>&#x2013;<lpage>D954</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw1074</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gayvert</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Madhukar</surname>
<given-names>N. S.</given-names>
</name>
<name>
<surname>Elemento</surname>
<given-names>O.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>A data-driven approach to predicting successes and failures of clinical trials</article-title>. <source>Cell Chem. Biol.</source> <volume>23</volume> (<issue>10</issue>), <fpage>1294</fpage>&#x2013;<lpage>1301</lpage>. <pub-id pub-id-type="doi">10.1016/j.chembiol.2016.07.023</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ghane Shahrbaf</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Assadi</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Drug-induced renal disorders</article-title>. <source>J. Ren. Inj. Prev.</source> <volume>4</volume> (<issue>3</issue>), <fpage>57</fpage>&#x2013;<lpage>60</lpage>. <pub-id pub-id-type="doi">10.12861/jrip.2015.12</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gold</surname>
<given-names>L. S.</given-names>
</name>
<name>
<surname>Manley</surname>
<given-names>N. B.</given-names>
</name>
<name>
<surname>Slone</surname>
<given-names>T. H.</given-names>
</name>
<name>
<surname>Rohrbach</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Garfinkel</surname>
<given-names>G. B.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Supplement to the carcinogenic potency database (CPDB): results of animal bioassays published in the general literature through 1997 and by the national toxicology program in 1997-1998</article-title>. <source>Toxicol. Sci.</source> <volume>85</volume> (<issue>2</issue>), <fpage>747</fpage>&#x2013;<lpage>808</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kfi161</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gong</surname>
<given-names>Y. N.</given-names>
</name>
<name>
<surname>Teng</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y. M.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>Y. X.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Z. R.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>W. H.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>
<italic>In silico</italic> prediction of potential drug-induced nephrotoxicity with machine learning methods</article-title>. <source>J. Appl. Toxicol.</source> <volume>42</volume> (<issue>10</issue>), <fpage>1639</fpage>&#x2013;<lpage>1650</lpage>. <pub-id pub-id-type="doi">10.1002/jat.4331</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Greene</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Fisk</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Naven</surname>
<given-names>R. T.</given-names>
</name>
<name>
<surname>Note</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Patel</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Pelletier</surname>
<given-names>D. J.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Developing structure-activity relationships for the prediction of hepatotoxicity</article-title>. <source>Chem. Res. Toxicol.</source> <volume>23</volume> (<issue>7</issue>), <fpage>1215</fpage>&#x2013;<lpage>1222</lpage>. <pub-id pub-id-type="doi">10.1021/tx1000865</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gu</surname>
<given-names>X. S.</given-names>
</name>
<name>
<surname>Manautou</surname>
<given-names>J. E.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Molecular mechanisms underlying chemical liver injury</article-title>. <source>Expert Rev. Mol. Med.</source> <volume>14</volume>, <fpage>e4</fpage>. <pub-id pub-id-type="doi">10.1017/S1462399411002110</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hansen</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Mika</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Schroeter</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sutter</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>ter Laak</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Steger-Hartmann</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Benchmark data set for <italic>in silico</italic> prediction of ames mutagenicity</article-title>. <source>J. Chem. Inf. Model.</source> <volume>49</volume> (<issue>9</issue>), <fpage>2077</fpage>&#x2013;<lpage>2081</lpage>. <pub-id pub-id-type="doi">10.1021/ci900161g</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heeren</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Scheja</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Metabolic-associated fatty liver disease and lipoprotein metabolism</article-title>. <source>Mol. Metab.</source> <volume>50</volume>, <fpage>101238</fpage>. <pub-id pub-id-type="doi">10.1016/j.molmet.2021.101238</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heyndrickx</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Mervin</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Morawietz</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sturm</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Friedrich</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zalewski</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>MELLODDY: cross-pharma federated learning at unprecedented scale unlocks benefits in QSAR without compromising proprietary information</article-title>. <source>J. Chem. Inf. Model.</source> <volume>64</volume> (<issue>7</issue>), <fpage>2331</fpage>&#x2013;<lpage>2344</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.3c00799</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoofnagle</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Serrano</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Knoben</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Navarro</surname>
<given-names>V. J.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>LiverTox: a website on drug-induced liver injury</article-title>. <source>Hepatology</source> <volume>57</volume> (<issue>3</issue>), <fpage>873</fpage>&#x2013;<lpage>874</lpage>. <pub-id pub-id-type="doi">10.1002/hep.26175</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="web">
<collab>ICH</collab> (<year>2020</year>). <article-title>S2(R1) genotoxicity testing and data interpretation for pharmaceuticals intended for human use</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/s2r1-genotoxicity-testing-and-data-interpretation-pharmaceuticals-intended-human-use">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/s2r1-genotoxicity-testing-and-data-interpretation-pharmaceuticals-intended-human-use</ext-link>.</comment>
</citation>
</ref>
<ref id="B47">
<citation citation-type="web">
<collab>ICH</collab> (<year>2022</year>). <article-title>S1B(R1) addendum to S1B testing for carcinogenicity of pharmaceuticals</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/s1br1-addendum-s1b-testing-carcinogenicity-pharmaceuticals">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/s1br1-addendum-s1b-testing-carcinogenicity-pharmaceuticals</ext-link>.</comment>
</citation>
</ref>
<ref id="B48">
<citation citation-type="web">
<collab>ICH</collab> (<year>2023</year>). <article-title>M7(R2) assessment and control of DNA reactive (mutagenic) impurities in pharmaceuticals to limit potential carcinogenic risk</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/guidance-industry-m7r2-assessment-and-control-dna-reactive-mutagenic-impurities-pharmaceuticals">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/guidance-industry-m7r2-assessment-and-control-dna-reactive-mutagenic-impurities-pharmaceuticals</ext-link>.</comment>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>C. S.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>P. P.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>G. X.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>
<italic>In silico</italic> prediction of chemical neurotoxicity using machine learning</article-title>. <source>Toxicol. Res.</source> <volume>9</volume> (<issue>3</issue>), <fpage>164</fpage>&#x2013;<lpage>172</lpage>. <pub-id pub-id-type="doi">10.1093/toxres/tfaa016</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Z. X.</given-names>
</name>
<name>
<surname>Hsieh</surname>
<given-names>C. Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>G. Y.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Could graph neural networks learn better molecular representation for drug discovery? A comparison study of descriptor-based and graph-based models</article-title>. <source>J. Cheminformatics</source> <volume>13</volume> (<issue>1</issue>), <fpage>12</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-020-00479-8</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Karim</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Balle</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sattar</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>CardioTox net: a robust predictor for hERG channel blockade based on deep learning meta-feature ensembles</article-title>. <source>J. Cheminformatics</source> <volume>13</volume> (<issue>1</issue>), <fpage>60</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-021-00541-z</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Nam</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>BayeshERG: a robust, reliable and interpretable deep learning model for predicting hERG channel blockers</article-title>. <source>Briefings Bioinforma.</source> <volume>23</volume> (<issue>4</issue>), <fpage>bbac211</fpage>. <pub-id pub-id-type="doi">10.1093/bib/bbac211</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Thiessen</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Bolton</surname>
<given-names>E. E.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Gindulyte</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>PubChem substance and compound databases</article-title>. <source>Nucleic Acids Res.</source> <volume>44</volume> (<issue>D1</issue>), <fpage>D1202</fpage>&#x2013;<lpage>D1213</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkv951</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kocot-Kepska</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zajaczkowska</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mika</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wordliczek</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Dobrogowski</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Przeklasa-Muszynska</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Peripheral mechanisms of neuropathic pain-the role of neuronal and non-neuronal interactions and their implications for topical treatment of neuropathic pain</article-title>. <source>Pharmaceuticals</source> <volume>14</volume> (<issue>2</issue>), <fpage>77</fpage>. <pub-id pub-id-type="doi">10.3390/ph14020077</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Konda</surname>
<given-names>L. S. K. P. S. K.</given-names>
</name>
<name>
<surname>Kristam</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>hERG liability classification models using machine learning techniques</article-title>. <source>Comput. Toxicol.</source> <volume>12</volume>, <fpage>100089</fpage>. <pub-id pub-id-type="doi">10.1016/j.comtox.2019.100089</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kosnik</surname>
<given-names>M. B.</given-names>
</name>
<name>
<surname>Strickland</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Marvel</surname>
<given-names>S. W.</given-names>
</name>
<name>
<surname>Wallis</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Wallace</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Richard</surname>
<given-names>A. M.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Concentration-response evaluation of ToxCast compounds for multivariate activity patterns of neural network function</article-title>. <source>Archives Toxicol.</source> <volume>94</volume> (<issue>2</issue>), <fpage>469</fpage>&#x2013;<lpage>484</lpage>. <pub-id pub-id-type="doi">10.1007/s00204-019-02636-x</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kotsampasakou</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ecker</surname>
<given-names>G. F.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Predicting drug-induced cholestasis with the help of hepatic transporters&#x2014;an <italic>in silico</italic> modeling approach</article-title>. <source>J. Chem. Inf. Model.</source> <volume>57</volume> (<issue>3</issue>), <fpage>608</fpage>&#x2013;<lpage>615</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.6b00518</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kragstrup</surname>
<given-names>T. W.</given-names>
</name>
<name>
<surname>Glintborg</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Svensson</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>McMaster</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Robinson</surname>
<given-names>P. C.</given-names>
</name>
<name>
<surname>Deleuran</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Waiting for JAK inhibitor safety data</article-title>. <source>Rmd Open</source> <volume>8</volume> (<issue>1</issue>), <fpage>e002236</fpage>. <pub-id pub-id-type="doi">10.1136/rmdopen-2022-002236</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krewski</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Acosta</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Andersen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Anderson</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Bailar</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Boekelheide</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>Toxicity testing in the 21st century: a vision and a strategy</article-title>. <source>J. Toxicol. Environ. Health-Part B-Critical Rev.</source> <volume>13</volume> (<issue>2-4</issue>), <fpage>51</fpage>&#x2013;<lpage>138</lpage>. <pub-id pub-id-type="doi">10.1080/10937404.2010.483176</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kuhn</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Letunic</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Jensen</surname>
<given-names>L. J.</given-names>
</name>
<name>
<surname>Bork</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>The SIDER database of drugs and side effects</article-title>. <source>Nucleic Acids Res.</source> <volume>44</volume> (<issue>D1</issue>), <fpage>D1075</fpage>&#x2013;<lpage>D1079</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkv1075</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lagunin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Filimonov</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zakharov</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>F. C.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Computer-aided prediction of rodent carcinogenicity by PASS and CISOC-psct</article-title>. <source>Qsar and Comb. Sci.</source> <volume>28</volume> (<issue>8</issue>), <fpage>806</fpage>&#x2013;<lpage>810</lpage>. <pub-id pub-id-type="doi">10.1002/qsar.200860192</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lanevskij</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Didziapetris</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Sazonovas</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Physicochemical QSAR analysis of hERG inhibition revisited: towards a quantitative potency prediction</article-title>. <source>J. Computer-Aided Mol. Des.</source> <volume>36</volume> (<issue>12</issue>), <fpage>837</fpage>&#x2013;<lpage>849</lpage>. <pub-id pub-id-type="doi">10.1007/s10822-022-00483-0</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Yoo</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>hERGAT: predicting hERG blockers using graph attention mechanism through atom- and molecule-level interaction analyses</article-title>. <source>J. Cheminformatics</source> <volume>17</volume> (<issue>1</issue>), <fpage>11</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-025-00957-x</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yoo</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>InterDILI: interpretable prediction of drug-induced liver injury through permutation feature importance and attention mechanism</article-title>. <source>J. Cheminformatics</source> <volume>16</volume> (<issue>1</issue>), <fpage>1</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-023-00796-8</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Legradi</surname>
<given-names>J. B.</given-names>
</name>
<name>
<surname>Di Paolo</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Kraak</surname>
<given-names>M. H. S.</given-names>
</name>
<name>
<surname>van der Geest</surname>
<given-names>H. G.</given-names>
</name>
<name>
<surname>Schymanski</surname>
<given-names>E. L.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>A. J.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>An ecotoxicological view on neurotoxicity assessment</article-title>. <source>Environ. Sci. Eur.</source> <volume>30</volume>, <fpage>46</fpage>&#x2013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1186/s12302-018-0173-x</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Q. Y.</given-names>
</name>
<name>
<surname>Jorgensen</surname>
<given-names>F. S.</given-names>
</name>
<name>
<surname>Oprea</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Brunak</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Taboureau</surname>
<given-names>O.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>hERG classification model based on a combination of support vector machine method and GRIND descriptors</article-title>. <source>Mol. Pharm.</source> <volume>5</volume> (<issue>1</issue>), <fpage>117</fpage>&#x2013;<lpage>127</lpage>. <pub-id pub-id-type="doi">10.1021/mp700124e</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>H. W.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>L. W.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>MutagenPred-GCNNs: a graph convolutional neural network-based classification model for mutagenicity prediction with data-driven molecular fingerprints</article-title>. <source>Interdiscip. Sciences-Computational Life Sci.</source> <volume>13</volume> (<issue>1</issue>), <fpage>25</fpage>&#x2013;<lpage>33</lpage>. <pub-id pub-id-type="doi">10.1007/s12539-020-00407-2</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W. D.</given-names>
</name>
<name>
<surname>Roberts</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z. C.</given-names>
</name>
<name>
<surname>Thakkar</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>DeepCarc: deep learning-powered carcinogenicity prediction using model-level representation</article-title>. <source>Front. Artif. Intell.</source> <volume>4</volume>, <fpage>757780</fpage>. <pub-id pub-id-type="doi">10.3389/frai.2021.757780</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liew</surname>
<given-names>C. Y.</given-names>
</name>
<name>
<surname>Lim</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Yap</surname>
<given-names>C. W.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Mixed learning algorithms and features ensemble in hepatotoxicity prediction</article-title>. <source>J. Computer-Aided Mol. Des.</source> <volume>25</volume> (<issue>9</issue>), <fpage>855</fpage>&#x2013;<lpage>871</lpage>. <pub-id pub-id-type="doi">10.1007/s10822-011-9468-3</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>A. N. K.</given-names>
</name>
<name>
<surname>Seal</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>H. B.</given-names>
</name>
<name>
<surname>Bender</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Using chemical and biological data to predict drug toxicity</article-title>. <source>Slas Discov.</source> <volume>28</volume> (<issue>3</issue>), <fpage>53</fpage>&#x2013;<lpage>64</lpage>. <pub-id pub-id-type="doi">10.1016/j.slasd.2022.12.003</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>L. L.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>H. W.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Prediction of the blood-brain barrier (BBB) permeability of chemicals based on machine-learning and ensemble methods</article-title>. <source>Chem. Res. Toxicol.</source> <volume>34</volume> (<issue>6</issue>), <fpage>1456</fpage>&#x2013;<lpage>1467</lpage>. <pub-id pub-id-type="doi">10.1021/acs.chemrestox.0c00343</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>T. Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L. L.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Prediction of hERG potassium channel blockage using ensemble learning methods and molecular fingerprints</article-title>. <source>Toxicol. Lett.</source> <volume>332</volume>, <fpage>88</fpage>&#x2013;<lpage>96</lpage>. <pub-id pub-id-type="doi">10.1016/j.toxlet.2020.07.003</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>T. Q.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Y. M.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jorissen</surname>
<given-names>R. N.</given-names>
</name>
<name>
<surname>Gilson</surname>
<given-names>M. K.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>BindingDB: a web-accessible database of experimentally determined protein-ligand binding affinities</article-title>. <source>Nucleic Acids Res.</source> <volume>35</volume>, <fpage>D198</fpage>&#x2013;<lpage>D201</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkl999</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2024</year>). <source>Moleculargpt: open large language model (llm) for few-shot molecular property prediction</source>. <comment>arXiv:2406</comment>.<fpage>12950</fpage>
</citation>
</ref>
<ref id="B75">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Lundberg</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S. I.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>A unified approach to interpreting model predictions</article-title>,&#x201d; in <conf-name>NIPS&#x27;17: Proceedings of the 31st International Conference on Neural Information Processing Systems</conf-name>, <conf-loc>Long Beach California USA</conf-loc>, <conf-date>December 4 - 9, 2017</conf-date>, <fpage>4768</fpage>&#x2013;<lpage>4777</lpage>.)</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mak</surname>
<given-names>K. K.</given-names>
</name>
<name>
<surname>Pichika</surname>
<given-names>M. R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Artificial intelligence in drug development: present status and future prospects</article-title>. <source>Drug Discov. Today</source> <volume>24</volume> (<issue>3</issue>), <fpage>773</fpage>&#x2013;<lpage>780</lpage>. <pub-id pub-id-type="doi">10.1016/j.drudis.2018.11.014</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mart&#xed;nez</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Sabando</surname>
<given-names>M. V.</given-names>
</name>
<name>
<surname>Soto</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Roca</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Requena-Triguero</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Campillo</surname>
<given-names>N. E.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Multitask deep neural networks for ames mutagenicity prediction</article-title>. <source>J. Chem. Inf. Model.</source> <volume>62</volume> (<issue>24</issue>), <fpage>6342</fpage>&#x2013;<lpage>6351</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.2c00532</pub-id>
</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mastropietro</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pasculli</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Feldmann</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Rodr&#xed;guez-P&#xe9;rez</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bajorath</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>EdgeSHAPer: bond-centric Shapley value-based explanation method for graph neural networks</article-title>. <source>Iscience</source> <volume>25</volume> (<issue>10</issue>), <fpage>105043</fpage>. <pub-id pub-id-type="doi">10.1016/j.isci.2022.105043</pub-id>
</citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mazumdar</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Sarma</surname>
<given-names>P. K. D.</given-names>
</name>
<name>
<surname>Mahanta</surname>
<given-names>H. J.</given-names>
</name>
<name>
<surname>Sastry</surname>
<given-names>G. N.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Machine learning based dynamic consensus model for predicting blood-brain barrier permeability</article-title>. <source>Comput. Biol. Med.</source> <volume>160</volume>, <fpage>106984</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.106984</pub-id>
</citation>
</ref>
<ref id="B80">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>McNaught</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Wilkinson</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2025</year>). <source>&#x27;toxicity&#x27; in IUPAC compendium of chemical terminology</source>. <edition>5th ed.</edition> <publisher-loc>IUPAC</publisher-loc>: <publisher-name>International Union of Pure and Applied Chemistry</publisher-name>.</citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mulliner</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Stolte</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Spirkl</surname>
<given-names>H. P.</given-names>
</name>
<name>
<surname>Czich</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Amberg</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Computational models for human and animal hepatotoxicity with a global application scope</article-title>. <source>Chem. Res. Toxicol.</source> <volume>29</volume> (<issue>5</issue>), <fpage>757</fpage>&#x2013;<lpage>767</lpage>. <pub-id pub-id-type="doi">10.1021/acs.chemrestox.5b00465</pub-id>
</citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Munawar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Vandenberg</surname>
<given-names>J. I.</given-names>
</name>
<name>
<surname>Jabeen</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Molecular docking guided grid-independent descriptor analysis to probe the impact of water molecules on conformational changes of hERG inhibitors in drug trapping phenomenon</article-title>. <source>Int. J. Mol. Sci.</source> <volume>20</volume> (<issue>14</issue>), <fpage>3385</fpage>. <pub-id pub-id-type="doi">10.3390/ijms20143385</pub-id>
</citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Myung</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>de Sa</surname>
<given-names>A. G. C.</given-names>
</name>
<name>
<surname>Ascher</surname>
<given-names>D. B.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Deep-PK: deep learning for small molecule pharmacokinetic and toxicity prediction</article-title>. <source>Nucleic Acids Res.</source> <volume>52</volume> (<issue>W1</issue>), <fpage>W469</fpage>&#x2013;<lpage>W475</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkae254</pub-id>
</citation>
</ref>
<ref id="B84">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Negami</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Araki</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Okuno</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Terada</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Calculation of absolute binding free energies between the hERG channel and structurally diverse drugs</article-title>. <source>Sci. Rep.</source> <volume>9</volume> (<issue>1</issue>), <fpage>16586</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-019-53120-6</pub-id>
</citation>
</ref>
<ref id="B85">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nohmi</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Thresholds of genotoxic and non-genotoxic carcinogens</article-title>. <source>Toxicol. Res.</source> <volume>34</volume> (<issue>4</issue>), <fpage>281</fpage>&#x2013;<lpage>290</lpage>. <pub-id pub-id-type="doi">10.5487/Tr.2018.34.4.281</pub-id>
</citation>
</ref>
<ref id="B86">
<citation citation-type="book">
<collab>NRC</collab> (<year>1994</year>). <source>Science and judgment in risk assessment<italic>. National research Council (US) Committee on risk Assessment of hazardous air pollutants</italic>
</source>. <publisher-loc>Washington (DC)</publisher-loc>: <publisher-name>National Academies Press US</publisher-name>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/books/NBK208246/">https://www.ncbi.nlm.nih.gov/books/NBK208246/</ext-link>.</comment>
</citation>
</ref>
<ref id="B87">
<citation citation-type="book">
<collab>OECD</collab> (<year>2014</year>). &#x201c;<article-title>Guidance document on the validation of (quantitative) structure-activity relationship [(Q)SAR] models</article-title>,&#x201d; in <source>OECD series on testing and assessment</source>. <publisher-loc>Paris</publisher-loc>.</citation>
</ref>
<ref id="B88">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pang</surname>
<given-names>X. D.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>X. J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y. Z.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>H. M.</given-names>
</name>
<etal/>
</person-group> (<year>2025</year>). <article-title>NeuTox 2.0: a hybrid deep learning architecture for screening potential neurotoxicity of chemicals based on multimodal feature fusion</article-title>. <source>Environ. Int.</source> <volume>195</volume>, <fpage>109244</fpage>. <pub-id pub-id-type="doi">10.1016/j.envint.2024.109244</pub-id>
</citation>
</ref>
<ref id="B89">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Papamokos</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Silins</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Combining QSAR modeling and text-mining techniques to link chemical structures and carcinogenic modes of action</article-title>. <source>Front. Pharmacol.</source> <volume>7</volume>, <fpage>284</fpage>. <pub-id pub-id-type="doi">10.3389/fphar.2016.00284</pub-id>
</citation>
</ref>
<ref id="B90">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Pei</surname>
<given-names>Q. Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>K. H.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>K. Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>L. J.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). &#x201c;<article-title>BioT5: enriching cross-modal integration in biology with chemical knowledge and natural language associations</article-title>,&#x201d; in <conf-name>2023 Conference on Empirical Methods in Natural Language Processing, Emnlp 2023</conf-name>, <conf-loc>Singapore</conf-loc>, <conf-date>December 6&#x2013;10, 2023</conf-date>, <fpage>1102</fpage>&#x2013;<lpage>1123</lpage>.</citation>
</ref>
<ref id="B91">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pognan</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Beilmann</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Boonen</surname>
<given-names>H. C. M.</given-names>
</name>
<name>
<surname>Czich</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Dear</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Hewitt</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>The evolving role of investigative toxicology in the pharmaceutical industry</article-title>. <source>Nat. Rev. Drug Discov.</source> <volume>22</volume> (<issue>4</issue>), <fpage>317</fpage>&#x2013;<lpage>335</lpage>. <pub-id pub-id-type="doi">10.1038/s41573-022-00633-x</pub-id>
</citation>
</ref>
<ref id="B92">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Quinton</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Latry</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Biour</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Hepatox(C) - a database about hepatotoxic drugs</article-title>. <source>Gastroenterologie Clinique Biol.</source> <volume>17</volume> (<issue>5bis</issue>), <fpage>H116</fpage>&#x2013;<lpage>H120</lpage>.</citation>
</ref>
<ref id="B93">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rao</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nassiri</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Alhambra</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Snoeys</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Van Goethem</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Irrechukwu</surname>
<given-names>O.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>AI/ML models to predict the severity of drug-induced liver injury for small molecules</article-title>. <source>Chem. Res. Toxicol.</source> <volume>36</volume> (<issue>7</issue>), <fpage>1129</fpage>&#x2013;<lpage>1139</lpage>. <pub-id pub-id-type="doi">10.1021/acs.chemrestox.3c00098</pub-id>
</citation>
</ref>
<ref id="B94">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Regev</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Drug-induced liver injury and drug development: industry perspective</article-title>. <source>Seminars Liver Dis.</source> <volume>34</volume> (<issue>2</issue>), <fpage>227</fpage>&#x2013;<lpage>239</lpage>. <pub-id pub-id-type="doi">10.1055/s-0034-1375962</pub-id>
</citation>
</ref>
<ref id="B95">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reiser</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Neubert</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Eberhard</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Torresi</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Shao</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Graph neural networks for materials science and chemistry</article-title>. <source>Commun. Mater.</source> <volume>3</volume> (<issue>1</issue>), <fpage>93</fpage>. <pub-id pub-id-type="doi">10.1038/s43246-022-00315-6</pub-id>
</citation>
</ref>
<ref id="B96">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ren</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Atyah</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W. Y.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>C. H.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>The various aspects of genetic and epigenetic toxicology: testing methods and clinical applications</article-title>. <source>J. Transl. Med.</source> <volume>15</volume>, <fpage>110</fpage>. <pub-id pub-id-type="doi">10.1186/s12967-017-1218-4</pub-id>
</citation>
</ref>
<ref id="B97">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Richard</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Waidyanatha</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Shinn</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Collins</surname>
<given-names>B. J.</given-names>
</name>
<name>
<surname>Thillainadarajah</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>The Tox21 10K compound library: collaborative chemistry advancing toxicology</article-title>. <source>Chem. Res. Toxicol.</source> <volume>34</volume> (<issue>2</issue>), <fpage>189</fpage>&#x2013;<lpage>216</lpage>. <pub-id pub-id-type="doi">10.1021/acs.chemrestox.0c00264</pub-id>
</citation>
</ref>
<ref id="B98">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Richard</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Judson</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Houck</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Grulke</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Volarath</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Thillainadarajah</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>ToxCast chemical landscape: paving the road to 21st century toxicology</article-title>. <source>Chem. Res. Toxicol.</source> <volume>29</volume> (<issue>8</issue>), <fpage>1225</fpage>&#x2013;<lpage>1251</lpage>. <pub-id pub-id-type="doi">10.1021/acs.chemrestox.6b00135</pub-id>
</citation>
</ref>
<ref id="B99">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rodr&#xed;guez-P&#xe9;rez</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bajorath</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Interpretation of machine learning models using shapley values: application to compound potency and multi-target activity predictions</article-title>. <source>J. Computer-Aided Mol. Des.</source> <volume>34</volume> (<issue>10</issue>), <fpage>1013</fpage>&#x2013;<lpage>1026</lpage>. <pub-id pub-id-type="doi">10.1007/s10822-020-00314-0</pub-id>
</citation>
</ref>
<ref id="B100">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ryu</surname>
<given-names>J. Y.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>M. Y.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>B. H.</given-names>
</name>
<name>
<surname>Oh</surname>
<given-names>K. S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>DeepHIT: a deep learning framework for prediction of hERG-induced cardiotoxicity</article-title>. <source>Bioinformatics</source> <volume>36</volume> (<issue>10</issue>), <fpage>3049</fpage>&#x2013;<lpage>3055</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btaa075</pub-id>
</citation>
</ref>
<ref id="B101">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schrenk</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>What is the meaning of &#x27;A compound is carcinogenic</article-title>. <source>Toxicol. Rep.</source> <volume>5</volume>, <fpage>504</fpage>&#x2013;<lpage>511</lpage>. <pub-id pub-id-type="doi">10.1016/j.toxrep.2018.04.002</pub-id>
</citation>
</ref>
<ref id="B102">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schwaller</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Laino</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Gaudin</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Bolgar</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Hunter</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Bekas</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Molecular transformer: a model for uncertainty-calibrated chemical reaction prediction</article-title>. <source>Acs Central Sci.</source> <volume>5</volume> (<issue>9</issue>), <fpage>1572</fpage>&#x2013;<lpage>1583</lpage>. <pub-id pub-id-type="doi">10.1021/acscentsci.9b00576</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seal</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hosseini-Gerami</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Mahale</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Carpenter</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Spjuth</surname>
<given-names>O.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Improved detection of drug-induced liver injury by integrating predicted and experimental data</article-title>. <source>Chem. Res. Toxicol.</source> <volume>37</volume> (<issue>8</issue>), <fpage>1290</fpage>&#x2013;<lpage>1305</lpage>. <pub-id pub-id-type="doi">10.1021/acs.chemrestox.4c00015</pub-id>
</citation>
</ref>
<ref id="B103">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname>
<given-names>Y. P.</given-names>
</name>
<name>
<surname>Hua</surname>
<given-names>Y. Q.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>B. B.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>R. Q.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>
<italic>In silico</italic> prediction and insights into the structural basis of drug induced nephrotoxicity</article-title>. <source>Front. Pharmacol.</source> <volume>12</volume>, <fpage>793332</fpage>. <pub-id pub-id-type="doi">10.3389/fphar.2021.793332</pub-id>
</citation>
</ref>
<ref id="B104">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shinada</surname>
<given-names>N. K.</given-names>
</name>
<name>
<surname>Koyama</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Ikemori</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nishioka</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Hitaoka</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hakura</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Optimizing machine-learning models for mutagenicity prediction through better feature selection</article-title>. <source>Mutagenesis</source> <volume>37</volume> (<issue>3-4</issue>), <fpage>191</fpage>&#x2013;<lpage>202</lpage>. <pub-id pub-id-type="doi">10.1093/mutage/geac010</pub-id>
</citation>
</ref>
<ref id="B105">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Storchi</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Cruciani</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Cross</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>DeepGRID: deep learning using GRID descriptors for BBB prediction</article-title>. <source>J. Chem. Inf. Model.</source> <volume>63</volume> (<issue>17</issue>), <fpage>5496</fpage>&#x2013;<lpage>5512</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.3c00768</pub-id>
</citation>
</ref>
<ref id="B106">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Nie</surname>
<given-names>F. L.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A merged molecular representation deep learning method for blood-brain barrier permeability prediction</article-title>. <source>Briefings Bioinforma.</source> <volume>23</volume> (<issue>5</issue>), <fpage>bbac357</fpage>. <pub-id pub-id-type="doi">10.1093/bib/bbac357</pub-id>
</citation>
</ref>
<ref id="B107">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thakkar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z. C.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>L. H.</given-names>
</name>
<name>
<surname>Roberts</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W. D.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Drug-induced liver injury severity and toxicity (DILIst): binary classification of 1279 drugs by human hepatotoxicity</article-title>. <source>Drug Discov. Today</source> <volume>25</volume> (<issue>1</issue>), <fpage>201</fpage>&#x2013;<lpage>208</lpage>. <pub-id pub-id-type="doi">10.1016/j.drudis.2019.09.022</pub-id>
</citation>
</ref>
<ref id="B108">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tibo</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>J. Z.</given-names>
</name>
<name>
<surname>Janet</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Nittinger</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Engkvist</surname>
<given-names>O.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Exhaustive local chemical space exploration using a transformer model</article-title>. <source>Nat. Commun.</source> <volume>15</volume> (<issue>1</issue>), <fpage>7315</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-024-51672-4</pub-id>
</citation>
</ref>
<ref id="B109">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Valentine</surname>
<given-names>W. M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Toxic peripheral neuropathies: agents and mechanisms</article-title>. <source>Toxicol. Pathol.</source> <volume>48</volume> (<issue>1</issue>), <fpage>152</fpage>&#x2013;<lpage>173</lpage>. <pub-id pub-id-type="doi">10.1177/0192623319854326</pub-id>
</citation>
</ref>
<ref id="B110">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vamathevan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Clark</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Czodrowski</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Dunham</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Ferran</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Applications of machine learning in drug discovery and development</article-title>. <source>Nat. Rev. Drug Discov.</source> <volume>18</volume> (<issue>6</issue>), <fpage>463</fpage>&#x2013;<lpage>477</lpage>. <pub-id pub-id-type="doi">10.1038/s41573-019-0024-5</pub-id>
</citation>
</ref>
<ref id="B111">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Venkatraman</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>FP-ADMET: a compendium of fingerprint-based ADMET prediction models</article-title>. <source>J. Cheminformatics</source> <volume>13</volume> (<issue>1</issue>), <fpage>75</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-021-00557-5</pub-id>
</citation>
</ref>
<ref id="B112">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Villeneuve</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>Crump</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Garcia-Reyero</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Hecker</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hutchinson</surname>
<given-names>T. H.</given-names>
</name>
<name>
<surname>LaLone</surname>
<given-names>C. A.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Adverse outcome pathway (AOP) development I: strategies and principles</article-title>. <source>Toxicol. Sci.</source> <volume>142</volume> (<issue>2</issue>), <fpage>312</fpage>&#x2013;<lpage>320</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kfu199</pub-id>
</citation>
</ref>
<ref id="B113">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Walker</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Ryder</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lavado</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Dilworth</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Riley</surname>
<given-names>R. J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The evolution of strategies to minimise the risk of human drug-induced liver injury (DILI) in drug discovery and development</article-title>. <source>Archives Toxicol.</source> <volume>94</volume> (<issue>8</issue>), <fpage>2559</fpage>&#x2013;<lpage>2585</lpage>. <pub-id pub-id-type="doi">10.1007/s00204-020-02763-w</pub-id>
</citation>
</ref>
<ref id="B114">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>S. Q.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>H. Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y. Y.</given-names>
</name>
<name>
<surname>Hou</surname>
<given-names>T. J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>ADMET evaluation in drug discovery. 16. Predicting hERG blockers by combining multiple pharmacophores and machine learning approaches</article-title>. <source>Mol. Pharm.</source> <volume>13</volume> (<issue>8</issue>), <fpage>2855</fpage>&#x2013;<lpage>2866</lpage>. <pub-id pub-id-type="doi">10.1021/acs.molpharmaceut.6b00471</pub-id>
</citation>
</ref>
<ref id="B115">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>T. Y.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>J. Q.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Investigating cardiotoxicity related with hERG channel blockers using molecular fingerprints and graph attention mechanism</article-title>. <source>Comput. Biol. Med.</source> <volume>153</volume>, <fpage>106464</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2022.106464</pub-id>
</citation>
</ref>
<ref id="B116">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y. M.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>M. T.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Z. R.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Identification of vital chemical information via visualization of graph neural networks</article-title>. <source>Briefings Bioinforma.</source> <volume>24</volume> (<issue>1</issue>), <fpage>bbac577</fpage>. <pub-id pub-id-type="doi">10.1093/bib/bbac577</pub-id>
</citation>
</ref>
<ref id="B117">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wellawatte</surname>
<given-names>G. P.</given-names>
</name>
<name>
<surname>Seshadri</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>White</surname>
<given-names>A. D.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Model agnostic generation of counterfactual explanations for molecules</article-title>. <source>Chem. Sci.</source> <volume>13</volume> (<issue>13</issue>), <fpage>3697</fpage>&#x2013;<lpage>3705</lpage>. <pub-id pub-id-type="doi">10.1039/d1sc05259d</pub-id>
</citation>
</ref>
<ref id="B118">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Rush</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Panickan</surname>
<given-names>V. A.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X. Y.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>T. R.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Multimodal representation learning for predicting molecule-disease relations</article-title>. <source>Bioinformatics</source> <volume>39</volume> (<issue>2</issue>), <fpage>btad085</fpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btad085</pub-id>
</citation>
</ref>
<ref id="B119">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wigh</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Goodman</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Lapkin</surname>
<given-names>A. A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A review of molecular representation in the age of machine learning</article-title>. <source>Wiley Interdiscip. Reviews-Computational Mol. Sci.</source> <volume>12</volume> (<issue>5</issue>), <fpage>e1603</fpage>. <pub-id pub-id-type="doi">10.1002/wcms.1603</pub-id>
</citation>
</ref>
<ref id="B120">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wishart</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Feunang</surname>
<given-names>Y. D.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Lo</surname>
<given-names>E. J.</given-names>
</name>
<name>
<surname>Marcu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Grant</surname>
<given-names>J. R.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>DrugBank 5.0: a major update to the DrugBank database for 2018</article-title>. <source>Nucleic Acids Res.</source> <volume>46</volume> (<issue>D1</issue>), <fpage>D1074</fpage>&#x2013;<lpage>D1082</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkx1037</pub-id>
</citation>
</ref>
<ref id="B121">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>L. L.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>B. W.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>TOXRIC: a comprehensive database of toxicological data and benchmarks</article-title>. <source>Nucleic Acids Res.</source> <volume>51</volume> (<issue>D1</issue>), <fpage>D1432</fpage>&#x2013;<lpage>D1445</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkac1074</pub-id>
</citation>
</ref>
<ref id="B122">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>W. X.</given-names>
</name>
<name>
<surname>Qian</surname>
<given-names>J. Y.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>J. Y.</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>G. B.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Q. P.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>GeoDILI: a robust and interpretable model for drug-induced liver injury prediction using graph neural network-based molecular geometric representation</article-title>. <source>Chem. Res. Toxicol.</source> <volume>36</volume> (<issue>11</issue>), <fpage>1717</fpage>&#x2013;<lpage>1730</lpage>. <pub-id pub-id-type="doi">10.1021/acs.chemrestox.3c00199</pub-id>
</citation>
</ref>
<ref id="B123">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Z. X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J. K.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>H. Y.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Chemistry-intuitive explanation of graph neural networks for molecular property prediction with substructure masking</article-title>. <source>Nat. Commun.</source> <volume>14</volume> (<issue>1</issue>), <fpage>2585</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-023-38192-3</pub-id>
</citation>
</ref>
<ref id="B124">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>C. Y.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>F. X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>G. X.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>
<italic>In silico</italic> prediction of chemical ames mutagenicity</article-title>. <source>J. Chem. Inf. Model.</source> <volume>52</volume> (<issue>11</issue>), <fpage>2840</fpage>&#x2013;<lpage>2847</lpage>. <pub-id pub-id-type="doi">10.1021/ci300400a</pub-id>
</citation>
</ref>
<ref id="B125">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>H. Y.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Y. P.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y. X.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Zan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Deep active learning with high structural discriminability for molecular mutagenicity prediction</article-title>. <source>Commun. Biol.</source> <volume>7</volume> (<issue>1</issue>), <fpage>1071</fpage>. <pub-id pub-id-type="doi">10.1038/s42003-024-06758-6</pub-id>
</citation>
</ref>
<ref id="B126">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>J. H. J.</given-names>
</name>
<name>
<surname>Henstock</surname>
<given-names>P. V.</given-names>
</name>
<name>
<surname>Dunn</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Chabot</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>de Graaf</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Cellular imaging predictions of clinical drug-induced liver injury</article-title>. <source>Toxicol. Sci.</source> <volume>105</volume> (<issue>1</issue>), <fpage>97</fpage>&#x2013;<lpage>105</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kfn109</pub-id>
</citation>
</ref>
<ref id="B127">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>P. C.</given-names>
</name>
<name>
<surname>Ji</surname>
<given-names>X. B.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>W. C.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Small data machine learning in materials science</article-title>. <source>Npj Comput. Mater.</source> <volume>9</volume> (<issue>1</issue>), <fpage>42</fpage>. <pub-id pub-id-type="doi">10.1038/s41524-023-01000-z</pub-id>
</citation>
</ref>
<ref id="B128">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>Y. J.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>Z. W.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>F. J.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Pei</surname>
<given-names>J. F.</given-names>
</name>
<name>
<surname>Lai</surname>
<given-names>L. H.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Deep learning for drug-induced liver injury</article-title>. <source>J. Chem. Inf. Model.</source> <volume>55</volume> (<issue>10</issue>), <fpage>2085</fpage>&#x2013;<lpage>2093</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.5b00238</pub-id>
</citation>
</ref>
<ref id="B129">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan</surname>
<given-names>B. W.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>X. N.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>L. L.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>An algorithm framework for drug-induced liver injury prediction based on genetic algorithm and ensemble learning</article-title>. <source>Molecules</source> <volume>27</volume> (<issue>10</issue>), <fpage>3112</fpage>. <pub-id pub-id-type="doi">10.3390/molecules27103112</pub-id>
</citation>
</ref>
<ref id="B130">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>H. B.</given-names>
</name>
<name>
<surname>Lou</surname>
<given-names>C. F.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>L. X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>admetSAR 2.0: web-service for prediction and optimization of chemical ADMET properties</article-title>. <source>Bioinformatics</source> <volume>35</volume> (<issue>6</issue>), <fpage>1067</fpage>&#x2013;<lpage>1069</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bty707</pub-id>
</citation>
</ref>
<ref id="B131">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>P. C.</given-names>
</name>
<name>
<surname>DeMarco</surname>
<given-names>K. R.</given-names>
</name>
<name>
<surname>Aghasafari</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Jeng</surname>
<given-names>M. T.</given-names>
</name>
<name>
<surname>Dawson</surname>
<given-names>J. R. D.</given-names>
</name>
<name>
<surname>Bekker</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>A computational pipeline to predict cardiotoxicity from the atom to the rhythm</article-title>. <source>Circulation Res.</source> <volume>126</volume> (<issue>8</issue>), <fpage>947</fpage>&#x2013;<lpage>964</lpage>. <pub-id pub-id-type="doi">10.1161/Circresaha.119.316404</pub-id>
</citation>
</ref>
<ref id="B132">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>T. B.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>X. Y.</given-names>
</name>
<name>
<surname>Mcmichael</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Pun</surname>
<given-names>F. W.</given-names>
</name>
<name>
<surname>Aliper</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>AttenhERG: a reliable and interpretable graph neural network framework for predicting hERG channel blockers</article-title>. <source>J. Cheminformatics</source> <volume>16</volume> (<issue>1</issue>), <fpage>143</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-024-00940-y</pub-id>
</citation>
</ref>
<ref id="B133">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Ying</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bourgeois</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>You</surname>
<given-names>J. X.</given-names>
</name>
<name>
<surname>Zitnik</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Leskovec</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2019</year>). &#x201c;<article-title>GNNExplainer: generating explanations for graph neural networks</article-title>,&#x201d; in <conf-name>Proceedings of the 33rd Conference on Neural Information Processing Systems NeurIPS</conf-name>, <conf-loc>Vancouver, Canada</conf-loc>, <conf-date>8-14 December 2019</conf-date>, <fpage>9240</fpage>&#x2013;<lpage>9251</lpage>.</citation>
</ref>
<ref id="B134">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>M.-S.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Cho</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Oh</surname>
<given-names>K.-S.</given-names>
</name>
<name>
<surname>Jang</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2025</year>). <article-title>hERGBoost: a gradient boosting model for quantitative IC50 prediction of hERG channel blockers</article-title>. <source>Comput. Biol. Med.</source> <volume>184</volume>, <fpage>109416</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2024.109416</pub-id>
</citation>
</ref>
<ref id="B135">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>J. X.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>J. X.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Development of an <italic>in silico</italic> prediction model for chemical-induced urinary tract toxicity by using naive Bayes classifier</article-title>. <source>Mol. Divers.</source> <volume>23</volume> (<issue>2</issue>), <fpage>381</fpage>&#x2013;<lpage>392</lpage>. <pub-id pub-id-type="doi">10.1007/s11030-018-9882-8</pub-id>
</citation>
</ref>
<ref id="B136">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>S. Z.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>Z. Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y. Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L. H.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>HelixADMET: a robust and endpoint extensible ADMET system incorporating self-supervised knowledge transfer</article-title>. <source>Bioinformatics</source> <volume>38</volume> (<issue>13</issue>), <fpage>3444</fpage>&#x2013;<lpage>3453</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btac342</pub-id>
</citation>
</ref>
<ref id="B137">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y. M.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>J. N.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>Y. R.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Prediction of hERG K&#x2b; channel blockage using deep neural networks</article-title>. <source>Chem. Biol. and Drug Des.</source> <volume>94</volume> (<issue>5</issue>), <fpage>1973</fpage>&#x2013;<lpage>1985</lpage>. <pub-id pub-id-type="doi">10.1111/cbdd.13600</pub-id>
</citation>
</ref>
<ref id="B138">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y. H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>R. Q.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Z. Y.</given-names>
</name>
<name>
<surname>Hua</surname>
<given-names>Y. Q.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Machine learning modeling and insights into the structural characteristics of drug-induced neurotoxicity</article-title>. <source>J. Chem. Inf. Model.</source> <volume>62</volume> (<issue>23</issue>), <fpage>6035</fpage>&#x2013;<lpage>6045</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.2c01131</pub-id>
</citation>
</ref>
<ref id="B139">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zheng</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y. D.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Identifying structure-property relationships through SMILES syntax analysis with self-attention mechanism</article-title>. <source>J. Chem. Inf. Model.</source> <volume>59</volume> (<issue>2</issue>), <fpage>914</fpage>&#x2013;<lpage>923</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.8b00803</pub-id>
</citation>
</ref>
<ref id="B140">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Martin</surname>
<given-names>T. M.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Sedykh</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Young</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Tropsha</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Quantitative structure-activity relationship modeling of rat acute toxicity by oral exposure</article-title>. <source>Chem. Res. Toxicol.</source> <volume>22</volume> (<issue>12</issue>), <fpage>1913</fpage>&#x2013;<lpage>1921</lpage>. <pub-id pub-id-type="doi">10.1021/tx900189p</pub-id>
</citation>
</ref>
</ref-list>
<sec id="s13">
<title>Glossary</title>
<def-list>
<def-item>
<term id="G1-fchem.2025.1632046">
<bold>ACC</bold>
</term>
<def>
<p>Accuracy</p>
</def>
</def-item>
<def-item>
<term id="G2-fchem.2025.1632046">
<bold>AEs</bold>
</term>
<def>
<p>Adverse Events</p>
</def>
</def-item>
<def-item>
<term id="G3-fchem.2025.1632046">
<bold>ADME</bold>
</term>
<def>
<p>Absorption, Distribution, Metabolism, and Excretion</p>
</def>
</def-item>
<def-item>
<term id="G4-fchem.2025.1632046">
<bold>ADMET</bold>
</term>
<def>
<p>Absorption, Distribution, Metabolism, Excretion, and Toxicity</p>
</def>
</def-item>
<def-item>
<term id="G5-fchem.2025.1632046">
<bold>AKI</bold>
</term>
<def>
<p>Acute Kidney Injury</p>
</def>
</def-item>
<def-item>
<term id="G6-fchem.2025.1632046">
<bold>AI</bold>
</term>
<def>
<p>Artificial Intelligence</p>
</def>
</def-item>
<def-item>
<term id="G7-fchem.2025.1632046">
<bold>AlogP</bold>
</term>
<def>
<p>Logarithm of Partition Coefficient</p>
</def>
</def-item>
<def-item>
<term id="G8-fchem.2025.1632046">
<bold>ANN</bold>
</term>
<def>
<p>Artificial Neural Network</p>
</def>
</def-item>
<def-item>
<term id="G9-fchem.2025.1632046">
<bold>AO</bold>
</term>
<def>
<p>Adverse Outcome</p>
</def>
</def-item>
<def-item>
<term id="G10-fchem.2025.1632046">
<bold>AOPs</bold>
</term>
<def>
<p>Adverse Outcome Pathways</p>
</def>
</def-item>
<def-item>
<term id="G11-fchem.2025.1632046">
<bold>AUROC</bold>
</term>
<def>
<p>Area Under the Receiver Operating Characteristic Curve</p>
</def>
</def-item>
<def-item>
<term id="G12-fchem.2025.1632046">
<bold>AUPRC</bold>
</term>
<def>
<p>Area Under the Precision&#x2013;Recall Curve</p>
</def>
</def-item>
<def-item>
<term id="G13-fchem.2025.1632046">
<bold>BAC</bold>
</term>
<def>
<p>Balanced Accuracy</p>
</def>
</def-item>
<def-item>
<term id="G14-fchem.2025.1632046">
<bold>BBB</bold>
</term>
<def>
<p>Blood&#x2013;Brain Barrier</p>
</def>
</def-item>
<def-item>
<term id="G15-fchem.2025.1632046">
<bold>CDK</bold>
</term>
<def>
<p>Chemistry Development Kit fingerprint</p>
</def>
</def-item>
<def-item>
<term id="G16-fchem.2025.1632046">
<bold>C4.5 DT</bold>
</term>
<def>
<p>C4.5 Decision Tree</p>
</def>
</def-item>
<def-item>
<term id="G17-fchem.2025.1632046">
<bold>CYP</bold>
</term>
<def>
<p>Cytochrome P450</p>
</def>
</def-item>
<def-item>
<term id="G18-fchem.2025.1632046">
<bold>CNN</bold>
</term>
<def>
<p>Convolutional Neural Network</p>
</def>
</def-item>
<def-item>
<term id="G19-fchem.2025.1632046">
<bold>DILI</bold>
</term>
<def>
<p>Drug-Induced Liver Injury</p>
</def>
</def-item>
<def-item>
<term id="G20-fchem.2025.1632046">
<bold>DIN</bold>
</term>
<def>
<p>Drug-Induced Nephrotoxicity</p>
</def>
</def-item>
<def-item>
<term id="G21-fchem.2025.1632046">
<bold>DMPNN</bold>
</term>
<def>
<p>Directed Message-Passing Neural Networks</p>
</def>
</def-item>
<def-item>
<term id="G22-fchem.2025.1632046">
<bold>DNN</bold>
</term>
<def>
<p>Deep Neural Network</p>
</def>
</def-item>
<def-item>
<term id="G23-fchem.2025.1632046">
<bold>ECFP</bold>
</term>
<def>
<p>Extended-Connectivity Fingerprint</p>
</def>
</def-item>
<def-item>
<term id="G24-fchem.2025.1632046">
<bold>EPA</bold>
</term>
<def>
<p>The U.S. Environmental Protection Agency</p>
</def>
</def-item>
<def-item>
<term id="G25-fchem.2025.1632046">
<bold>EHR</bold>
</term>
<def>
<p>Electronic Health Records</p>
</def>
</def-item>
<def-item>
<term id="G26-fchem.2025.1632046">
<bold>FCNN</bold>
</term>
<def>
<p>Fully Connected Neural Network</p>
</def>
</def-item>
<def-item>
<term id="G27-fchem.2025.1632046">
<bold>FDA</bold>
</term>
<def>
<p>The U.S. Food and Drug Administration</p>
</def>
</def-item>
<def-item>
<term id="G28-fchem.2025.1632046">
<bold>FP</bold>
</term>
<def>
<p>Fingerprint</p>
</def>
</def-item>
<def-item>
<term id="G29-fchem.2025.1632046">
<bold>GAT</bold>
</term>
<def>
<p>Graph Attention Networks</p>
</def>
</def-item>
<def-item>
<term id="G30-fchem.2025.1632046">
<bold>GCN</bold>
</term>
<def>
<p>Graph Convolutional Networks</p>
</def>
</def-item>
<def-item>
<term id="G31-fchem.2025.1632046">
<bold>GCNN</bold>
</term>
<def>
<p>Graph Convolutional Neural Network;</p>
</def>
</def-item>
<def-item>
<term id="G32-fchem.2025.1632046">
<bold>GeoGNN</bold>
</term>
<def>
<p>Geometry-based Graph Neural Network</p>
</def>
</def-item>
<def-item>
<term id="G33-fchem.2025.1632046">
<bold>GNN</bold>
</term>
<def>
<p>Graph Neural Network</p>
</def>
</def-item>
<def-item>
<term id="G34-fchem.2025.1632046">
<bold>GPU</bold>
</term>
<def>
<p>Graphics Processing Unit</p>
</def>
</def-item>
<def-item>
<term id="G35-fchem.2025.1632046">
<bold>GRU</bold>
</term>
<def>
<p>Gated Recurrent Unit</p>
</def>
</def-item>
<def-item>
<term id="G36-fchem.2025.1632046">
<bold>hERG</bold>
</term>
<def>
<p>Human Ether-&#xe0;-go-go Related Gene</p>
</def>
</def-item>
<def-item>
<term id="G37-fchem.2025.1632046">
<bold>HTS</bold>
</term>
<def>
<p>High-Throughput Screening</p>
</def>
</def-item>
<def-item>
<term id="G38-fchem.2025.1632046">
<bold>IC50</bold>
</term>
<def>
<p>Half Maximal Inhibitory Concentration</p>
</def>
</def-item>
<def-item>
<term id="G39-fchem.2025.1632046">
<bold>ICH</bold>
</term>
<def>
<p>The International Council for Harmonisation of Technical Requirements for Pharmaceuticals for Human Use</p>
</def>
</def-item>
<def-item>
<term id="G40-fchem.2025.1632046">
<bold>JAK</bold>
</term>
<def>
<p>Janus Kinase</p>
</def>
</def-item>
<def-item>
<term id="G41-fchem.2025.1632046">
<bold>KEs</bold>
</term>
<def>
<p>Key Events</p>
</def>
</def-item>
<def-item>
<term id="G42-fchem.2025.1632046">
<bold>kMedoids</bold>
</term>
<def>
<p>k-Medoids Clustering Algorithm</p>
</def>
</def-item>
<def-item>
<term id="G43-fchem.2025.1632046">
<bold>kNN</bold>
</term>
<def>
<p>k-Nearest Neighbor</p>
</def>
</def-item>
<def-item>
<term id="G44-fchem.2025.1632046">
<bold>LD50</bold>
</term>
<def>
<p>Lethal Dose for 50% of the Population</p>
</def>
</def-item>
<def-item>
<term id="G45-fchem.2025.1632046">
<bold>LGBM</bold>
</term>
<def>
<p>Light Gradient-Boosting Machine</p>
</def>
</def-item>
<def-item>
<term id="G46-fchem.2025.1632046">
<bold>LOAEL</bold>
</term>
<def>
<p>Lowest-Observed-Adverse-Effect Level</p>
</def>
</def-item>
<def-item>
<term id="G47-fchem.2025.1632046">
<bold>LR</bold>
</term>
<def>
<p>Linear Regression</p>
</def>
</def-item>
<def-item>
<term id="G48-fchem.2025.1632046">
<bold>LTKB</bold>
</term>
<def>
<p>Liver Toxicity Knowledge Base</p>
</def>
</def-item>
<def-item>
<term id="G49-fchem.2025.1632046">
<bold>MACCS</bold>
</term>
<def>
<p>Molecular ACCess System</p>
</def>
</def-item>
<def-item>
<term id="G50-fchem.2025.1632046">
<bold>MAE</bold>
</term>
<def>
<p>Mean Absolute Error</p>
</def>
</def-item>
<def-item>
<term id="G51-fchem.2025.1632046">
<bold>MAPE</bold>
</term>
<def>
<p>Mean Absolute Percentage Error</p>
</def>
</def-item>
<def-item>
<term id="G52-fchem.2025.1632046">
<bold>MCC</bold>
</term>
<def>
<p>Matthews Correlation Coefficient</p>
</def>
</def-item>
<def-item>
<term id="G53-fchem.2025.1632046">
<bold>MIEs</bold>
</term>
<def>
<p>Molecular initiating events</p>
</def>
</def-item>
<def-item>
<term id="G54-fchem.2025.1632046">
<bold>MMP</bold>
</term>
<def>
<p>Matrix metalloproteinase</p>
</def>
</def-item>
<def-item>
<term id="G55-fchem.2025.1632046">
<bold>MTT</bold>
</term>
<def>
<p>3-(4,5-Dimethylthiazol-2-yl)-2,5-Diphenyltetrazolium Bromide Assay</p>
</def>
</def-item>
<def-item>
<term id="G57-fchem.2025.1632046">
<bold>NCTR</bold>
</term>
<def>
<p>National Center for Toxicological Research</p>
</def>
</def-item>
<def-item>
<term id="G58-fchem.2025.1632046">
<bold>NOAEL</bold>
</term>
<def>
<p>No-Observed-Adverse-Effect Level</p>
</def>
</def-item>
<def-item>
<term id="G59-fchem.2025.1632046">
<bold>NSAIDs</bold>
</term>
<def>
<p>Non-Steroidal Anti-Inflammatory Drugs</p>
</def>
</def-item>
<def-item>
<term id="G60-fchem.2025.1632046">
<bold>OECD</bold>
</term>
<def>
<p>Organization for Economic Co-operation and Development</p>
</def>
</def-item>
<def-item>
<term id="G61-fchem.2025.1632046">
<bold>OECD TA</bold>
</term>
<def>
<p>OECD Toxicity Assays</p>
</def>
</def-item>
<def-item>
<term id="G62-fchem.2025.1632046">
<bold>PK</bold>
</term>
<def>
<p>Pharmacokinetic</p>
</def>
</def-item>
<def-item>
<term id="G63-fchem.2025.1632046">
<bold>PPB</bold>
</term>
<def>
<p>Plasma Protein Binding</p>
</def>
</def-item>
<def-item>
<term id="G64-fchem.2025.1632046">
<bold>PRC</bold>
</term>
<def>
<p>Precision&#x2013;Recall Curve</p>
</def>
</def-item>
<def-item>
<term id="G65-fchem.2025.1632046">
<bold>QNPR</bold>
</term>
<def>
<p>Quantitative Name&#x2013;Property Relationship</p>
</def>
</def-item>
<def-item>
<term id="G66-fchem.2025.1632046">
<bold>QSAR</bold>
</term>
<def>
<p>Quantitative Structure&#x2013;Activity Relationship</p>
</def>
</def-item>
<def-item>
<term id="G67-fchem.2025.1632046">
<bold>RF</bold>
</term>
<def>
<p>Random Forest</p>
</def>
</def-item>
<def-item>
<term id="G68-fchem.2025.1632046">
<bold>RMSE</bold>
</term>
<def>
<p>Root Mean Square Error</p>
</def>
</def-item>
<def-item>
<term id="G69-fchem.2025.1632046">
<bold>SGAT</bold>
</term>
<def>
<p>SMILES Graph Attention Network</p>
</def>
</def-item>
<def-item>
<term id="G70-fchem.2025.1632046">
<bold>SHAP</bold>
</term>
<def>
<p>SHapley Additive exPlanations</p>
</def>
</def-item>
<def-item>
<term id="G71-fchem.2025.1632046">
<bold>SIDER</bold>
</term>
<def>
<p>Side Effect Resource</p>
</def>
</def-item>
<def-item>
<term id="G72-fchem.2025.1632046">
<bold>SMILES</bold>
</term>
<def>
<p>Simplified Molecular Input Line Entry System</p>
</def>
</def-item>
<def-item>
<term id="G73-fchem.2025.1632046">
<bold>SMOTE</bold>
</term>
<def>
<p>Synthetic Minority Over-sampling Technique</p>
</def>
</def-item>
<def-item>
<term id="G74-fchem.2025.1632046">
<bold>SVM</bold>
</term>
<def>
<p>Support Vector Machine</p>
</def>
</def-item>
<def-item>
<term id="G75-fchem.2025.1632046">
<bold>XGBoost</bold>
</term>
<def>
<p>Extreme Gradient Boosting</p>
</def>
</def-item>
</def-list>
</sec>
</back>
</article>