<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Artif. Intell.</journal-id>
<journal-title>Frontiers in Artificial Intelligence</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Artif. Intell.</abbrev-journal-title>
<issn pub-type="epub">2624-8212</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/frai.2025.1624797</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Artificial Intelligence</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Conversational AI agent for precision oncology: AI-HOPE-WNT integrates clinical and genomic data to investigate WNT pathway dysregulation in colorectal cancer</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Yang</surname> <given-names>Ei-Wen</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Waldrup</surname> <given-names>Brigette</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Velazquez-Villarreal</surname> <given-names>Enrique</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2873387/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>PolyAgent</institution>, <addr-line>San Francisco, CA</addr-line>, <country>United States</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Integrative Translational Sciences, Beckman Research Institute of City of Hope</institution>, <addr-line>Duarte, CA</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>City of Hope Comprehensive Cancer Center</institution>, <addr-line>Duarte, CA</addr-line>, <country>United States</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0001">
<p>Edited by: Francesco Napolitano, University of Sannio, Italy</p></fn>
<fn fn-type="edited-by" id="fn0002">
<p>Reviewed by: Wenzheng Bao, Xuzhou University of Technology, China</p>
<p>Emre Sefer, &#x00D6;zye&#x011F;in University, T&#x00FC;rkiye</p>
<p>Alexis Germ&#x00E1;n Murillo Carrasco, University of S&#x00E3;o Paulo, Brazil</p></fn>
<corresp id="c001">&#x002A;Correspondence: Enrique Velazquez-Villarreal, <email>evelazquezvilla@coh.org</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>11</day>
<month>08</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>8</volume>
<elocation-id>1624797</elocation-id>
<history>
<date date-type="received">
<day>07</day>
<month>05</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>15</day>
<month>07</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Yang, Waldrup and Velazquez-Villarreal.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Yang, Waldrup and Velazquez-Villarreal</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec id="sec1">
<title>Introduction</title>
<p>The WNT signaling pathway is a key driver of colorectal cancer (CRC) initiation and progression, particularly in early-onset CRC (EOCRC) among underserved populations. However, interrogating WNT pathway dysregulation across clinical and genomic dimensions remains technically challenging, limiting both translational insight and personalized intervention strategies. To address this gap, we developed AI-HOPE-WNT, the first conversational artificial intelligence (AI) agent purpose-built to investigate WNT signaling in CRC using natural language&#x2013;driven, integrative bioinformatics.</p>
</sec>
<sec id="sec2">
<title>Methods</title>
<p>AI-HOPE-WNT employs a modular architecture combining large language models (LLMs), a natural language-to-code engine, and a backend statistical workflow interfaced with harmonized data from cBioPortal. Unlike general-purpose platforms, AI-HOPE-WNT is uniquely optimized for WNT-specific precision oncology. The tool supports mutation frequency analysis, odds ratio testing, survival modeling, and subgroup stratification by genomic, clinical, and demographic variables. To validate the platform, we recapitulated findings from two previous studies examining WNT pathway alterations in high-risk CRC populations, including mutation prevalence in RNF43 and AXIN2 and survival outcomes associated with WNT pathway status across ethnic and age subgroups. Exploratory queries further assessed treatment response, co-mutation patterns, and population-specific trends.</p>
</sec>
<sec id="sec3">
<title>Results</title>
<p>In recapitulation analyses, AI-HOPE-WNT reproduced key trends from prior work, including improved survival in WNT-altered EOCRC and higher RNF43 mutation rates in Hispanic/Latino (H/L) populations compared to non-Hispanic White (NHW) people. Exploratory analyses revealed several novel findings. Among FOLFOX-treated EOCRC patients, APC mutations were associated with significantly different survival outcomes (<italic>p</italic>&#x202F;=&#x202F;0.043). RNF43-mutant tumors showed worse survival in metastatic versus primary cases (<italic>p</italic>&#x202F;=&#x202F;0.028). AXIN1 and APC co-mutations demonstrated location-specific enrichment between colon and rectal tumors. Gender-based differences in AXIN2-mutant cases under varying MSI status yielded significant survival variation (<italic>p</italic>&#x202F;=&#x202F;0.036). Additionally, patients under 50 with APC-mutant primary tumors showed worse survival (<italic>p</italic>&#x202F;=&#x202F;0.031) and increased mutation prevalence.</p>
</sec>
<sec id="sec4">
<title>Conclusion</title>
<p>AI-HOPE-WNT is the first dedicated AI platform for WNT pathway analysis in CRC. By combining natural language interaction with automated, high-throughput bioinformatics, it democratizes access to pathway-specific precision oncology research. The platform is freely available at: <uri xlink:href="https://github.com/Velazquez-Villarreal-Lab/AI-HOPE-WNT">https://github.com/Velazquez-Villarreal-Lab/AI-HOPE-WNT</uri>.</p>
</sec>
</abstract>
<kwd-group>
<kwd>artificial intelligence</kwd>
<kwd>AI agent</kwd>
<kwd>precision oncology</kwd>
<kwd>large language model (LLM)</kwd>
<kwd>medical AI</kwd>
<kwd>healthcare AI</kwd>
<kwd>colorectal cancer</kwd>
<kwd>WNT pathway</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="0"/>
<equation-count count="3"/>
<ref-count count="39"/>
<page-count count="11"/>
<word-count count="7374"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Medicine and Public Health</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec5">
<title>Introduction</title>
<p>Colorectal cancer (CRC) remains one of the most common and deadly malignancies worldwide, with early-onset CRC (EOCRC) rising at an alarming rate&#x2014;particularly among populations at higher risk (<xref ref-type="bibr" rid="ref27">Sung et al., 2021</xref>; <xref ref-type="bibr" rid="ref25">Sinicrope, 2022</xref>; <xref ref-type="bibr" rid="ref29">Ullah et al., 2023</xref>; <xref ref-type="bibr" rid="ref17">Garcia et al., 2018</xref>). While molecular alterations in the WNT signaling pathway are well established as drivers of CRC pathogenesis (<xref ref-type="bibr" rid="ref5">Bugter et al., 2021</xref>; <xref ref-type="bibr" rid="ref37">Zhang and Wang, 2020</xref>; <xref ref-type="bibr" rid="ref23">Sanchez-Vega et al., 2018</xref>), characterizing these alterations in EOCRC, especially within high-risk groups, has been hindered by data fragmentation, underrepresentation in genomic datasets, and technical barriers to integrative analysis (<xref ref-type="bibr" rid="ref21">Monge et al., 2024</xref>; <xref ref-type="bibr" rid="ref8">Carranza et al., 2024</xref>; <xref ref-type="bibr" rid="ref16">Ferrell et al., 2024</xref>).</p>
<p>The WNT signaling pathway is central to colorectal tumorigenesis, with mutations in genes such as APC, CTNNB1, RNF43, and AXIN2 promoting uncontrolled <italic>&#x03B2;</italic>-catenin activity and transcriptional reprogramming (<xref ref-type="bibr" rid="ref6">Cancer Genome Atlas Network, 2012</xref>; <xref ref-type="bibr" rid="ref15">Farooqi et al., 2019</xref>; <xref ref-type="bibr" rid="ref36">Yuan et al., 2020</xref>; <xref ref-type="bibr" rid="ref29">Ullah et al., 2023</xref>). Studies suggest that WNT pathway activation is nearly ubiquitous in CRC, yet its prognostic and therapeutic implications may vary by age and ethnicity (<xref ref-type="bibr" rid="ref9">Carranza et al., 2025</xref>; <xref ref-type="bibr" rid="ref1">Antelo et al., 2012</xref>; <xref ref-type="bibr" rid="ref19">Lieu et al., 2019</xref>; <xref ref-type="bibr" rid="ref20">Mauri et al., 2019</xref>). Notably, recent investigations by our group have identified elevated frequencies of RNF43 and AXIN2 mutations in EOCRC patients from high-risk populations, such as Hispanic/Latino (H/L) individuals, compared to non-Hispanic White (NHW) people. These studies also revealed that alterations in the WNT signaling pathway are associated with improved survival outcomes in EOCRC (<xref ref-type="bibr" rid="ref26">Song et al., 2023</xref>; <xref ref-type="bibr" rid="ref35">Youssef et al., 2025</xref>; <xref ref-type="bibr" rid="ref10">Cerami et al., 2012</xref>).</p>
<p>Despite the availability of high-dimensional datasets from platforms such as The Cancer Genome Atlas (TCGA) and AACR GENIE, most existing tools [e.g., cBioPortal (<xref ref-type="bibr" rid="ref10">Cerami et al., 2012</xref>), Xena (<xref ref-type="bibr" rid="ref18">Goldman et al., 2020</xref>)] operate through predefined graphical interfaces and require multi-step analytic pipelines. These constraints limit the ability of non-programmers to explore clinically relevant, pathway-specific questions&#x2014;particularly those involving demographic subgroups or treatment response contexts (<xref ref-type="bibr" rid="ref14">Eralp and Sefer, 2024</xref>).</p>
<p>Recent advances in artificial intelligence (AI), particularly large language models (LLMs), have led to conversational agents capable of translating natural language instructions into executable bioinformatics code (<xref ref-type="bibr" rid="ref31">Xiao et al., 2020</xref>; <xref ref-type="bibr" rid="ref28">Suresh and Misra, 2024</xref>; <xref ref-type="bibr" rid="ref7">Carl&#x00E0; et al., 2025</xref>; <xref ref-type="bibr" rid="ref30">Velez-Arce et al., 2024</xref>). While AI platforms that aim to fully automate multi-omic analysis (<xref ref-type="bibr" rid="ref39">Zhou et al., 2024</xref>) demonstrate the promise of LLMs for biomedical research and precision oncology (<xref ref-type="bibr" rid="ref4">Bhinder et al., 2021</xref>; <xref ref-type="bibr" rid="ref12">Chen et al., 2021</xref>; <xref ref-type="bibr" rid="ref38">Zhang and Wei, 2023</xref>; <xref ref-type="bibr" rid="ref24">Shimizu and Nakayama, 2020</xref>; <xref ref-type="bibr" rid="ref13">Chua et al., 2021</xref>; <xref ref-type="bibr" rid="ref3">Bhalla and Lagan&#x00E0;, 2022</xref>; <xref ref-type="bibr" rid="ref22">Monge et al., 2025</xref>), few tools are pathway-focused or optimized for integrating clinical and genomic data within a precision oncology framework.</p>
<p>To bridge these gaps, we introduce AI-HOPE-WNT (Artificial Intelligence agent for High-Optimization and Precision Medicine focused on WNT), a conversational AI system designed to study WNT pathway dysregulation in CRC through natural language queries. The platform integrates public CRC genomics and clinical data, automates analyses such as survival modeling and odds ratio testing, and supports hypothesis generation at scale. In this study, we (1) developed AI-HOPE-WNT to interactively query CRC datasets, (2) recapitulate its analytical performance by reproducing key trends from our prior WNT-focused disparity studies, and (3) demonstrated its capacity for novel discovery by exploring context-specific WNT interactions in EOCRC. Together, these efforts establish AI-HOPE-WNT as a scalable and accessible solution for integrative, pathway-driven cancer research.</p>
</sec>
<sec sec-type="methods" id="sec6">
<title>Methods</title>
<sec id="sec7">
<title>AI-HOPE-WNT system architecture and workflow</title>
<p>AI-HOPE-WNT (Artificial Intelligence agent for High-Optimization and Precision Medicine focused on WNT) is a conversational AI platform purpose-built for investigating CRC through the lens of WNT pathway dysregulation. It utilizes a modular architecture composed of LLMs, a natural language-to-code translation engine, and a backend analytics pipeline that enables real-time case&#x2013;control analysis and hypothesis generation. Upon user input via natural language, the system performs automated query parsing, data retrieval, statistical testing, and visualization (<xref ref-type="fig" rid="fig1">Figure 1</xref>). Output includes Kaplan&#x2013;Meier survival curves, odds ratio metrics, frequency distributions, and narrative summaries contextualized by biomedical literature.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Overview of AI-HOPE-WNT workflow. This figure illustrates the complete workflow of AI-HOPE-WNT, a conversational AI system developed to analyze WNT pathway dysregulation in colorectal cancer (CRC) using natural language interaction. <bold>(a)</bold> Shows how the user begins by entering a natural language query, such as requesting survival analysis of CRC patients with APC mutations treated with FOLFOX or comparing RNF43 mutation prevalence between early-onset Hispanic/Latino and non-Hispanic White patients. In <bold>(b)</bold>, the system processes this input through a graphical user interface (GUI) and uses a large language model (LLM) to interpret the query, generate executable code, and apply appropriate data filters and subgroup stratifications. <bold>(c)</bold> Illustrates how AI-HOPE-WNT retrieves and integrates harmonized clinical and genomic data from public sources such as TCGA and cBioPortal, focusing on WNT-relevant genes like APC, CTNNB1, AXIN1, AXIN2, and RNF43. Finally, <bold>(d)</bold> shows the automated execution of statistical analyses&#x2014;such as Kaplan&#x2013;Meier survival estimation or odds ratio testing&#x2014;with results presented as high-quality visualizations and narrative summaries. This flowchart highlights the streamlined, reproducible, and user-friendly nature of the AI-HOPE-WNT system, which supports rapid and scalable clinical-genomic investigation in precision oncology.</p>
</caption>
<graphic xlink:href="frai-08-1624797-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Flowchart illustrating a data analysis process in four stages. a) A yellow box displays a natural language query about loading CRC data and selecting samples with FOLFOX treatment for case and control cohorts. b) A system with a graphical user interface processes the query, and an LLM generates code. c) Genomic data is integrated with clinical data into a dataset. d) Automatic statistical analysis results in a Kaplan-Meier survival curve and a stacked bar plot.</alt-text>
</graphic>
</fig>
<p>The AI-HOPE-WNT platform follows a structured, end-to-end workflow that transforms natural language queries into rigorous clinical-genomic analyses. Users begin by entering a plain English question&#x2014;for example, &#x201C;Compare survival in EOCRC patients with APC mutations versus wild-type receiving FOLFOX treatment.&#x201D; This query is interpreted by a fine-tuned large language model (LLaMA 3 variant), which converts the input into executable code using a natural language-to-code engine. The system then identifies and subsets relevant patient cohorts from harmonized cBioPortal datasets based on parameters such as mutation status, age, ethnicity, tumor location, MSI status, and treatment exposure. Once cohorts are defined, AI-HOPE-WNT performs statistical analyses appropriate to the query context, including odds ratio calculations, Kaplan&#x2013;Meier survival estimations, and Cox proportional hazards modeling. Results are returned as structured outputs&#x2014;such as tables, survival curves, and forest plots&#x2014;alongside automated narrative summaries contextualized by biomedical literature. Finally, the platform generates high-resolution visualizations and structured reports using Matplotlib and Plotly, enabling reproducible, publication-ready outputs. This integrated workflow enhances usability, transparency, and analytical rigor, establishing AI-HOPE-WNT as a robust tool for pathway-specific precision oncology research.</p>
</sec>
<sec id="sec8">
<title>LLM selection and configuration</title>
<p>The core language processing component of AI-HOPE-WNT is built on a variant of the LLaMA 3 large language model, selected for its balance of efficiency, scalability, and open architecture. This LLM was fine-tuned with domain-specific prompts and biomedical context to improve performance in interpreting clinical-genomic queries. The model operates within a retrieval-augmented generation (RAG) framework, which allows it to cross-reference structured biomedical knowledge sources during natural language-to-code translation. Prompt engineering techniques were applied to align model outputs with statistical and bioinformatics standards, reduce hallucination risk, and preserve analytical accuracy. Additionally, structured prompting ensures reproducibility, while the modular design allows for future upgrades or substitution with newer LLMs, ensuring continued adaptability as foundational AI models evolve.</p>
</sec>
<sec id="sec9">
<title>Evaluation metrics and statistical formulations</title>
<p>To evaluate cohort differences and mutation enrichment in AI-HOPE-WNT, we employed several standard statistical metrics. For categorical comparisons (e.g., mutation prevalence by subgroup), we used odds ratios (ORs), mathematically defined as:</p>
<p>where <italic>a</italic> and <italic>b</italic> represent the number of individuals with and without the mutation in group 1, and <italic>c</italic> and <italic>d</italic> represent the same in group 2. Confidence intervals (95%) for ORs were computed using the Woolf method.</p>
<disp-formula id="E1">
<mml:math id="M1">
<mml:mtext mathvariant="italic">OR</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>a</mml:mi>
<mml:mo>/</mml:mo>
<mml:mi>c</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>b</mml:mi>
<mml:mo>/</mml:mo>
<mml:mi>d</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
</mml:mfrac>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>a</mml:mi>
<mml:mo>&#x22C5;</mml:mo>
<mml:mi>d</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>b</mml:mi>
<mml:mo>&#x22C5;</mml:mo>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:math>
</disp-formula>
<p>For time-to-event data, we used Kaplan&#x2013;Meier survival estimates, with group differences assessed using the log-rank test, where the test statistic follows a chi-squared distribution:</p>
<disp-formula id="E2">
<mml:math id="M2">
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
<mml:mfrac>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>O</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mfrac>
</mml:math>
</disp-formula>
<p>with <italic>O&#x2081;</italic> as observed events, <italic>E&#x2081;</italic> as expected events, and <italic>V&#x2081;</italic> as the variance. For multivariable survival analysis, we used Cox proportional hazards models, defined as:</p>
<disp-formula id="E3">
<mml:math id="M3">
<mml:mi>h</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x22C5;</mml:mo>
<mml:mo>exp</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x03B2;</mml:mi>
<mml:mi>p</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>p</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula>
<p>where h(t&#x2223;X) is the hazard function at time <italic>t</italic> given covariates <italic>X</italic>, and <italic>&#x03B2;</italic> values are estimated log hazard ratios. Model significance was determined via likelihood ratio tests and Wald statistics.</p>
<p>These evaluation metrics are implemented programmatically within AI-HOPE-WNT&#x2019;s statistical backend to ensure consistency, interpretability, and reproducibility across analyses.</p>
</sec>
<sec id="sec10">
<title>Data integration and preprocessing</title>
<p>AI-HOPE-WNT interfaces with harmonized CRC datasets curated from cBioPortal and The Cancer Genome Atlas (TCGA), with emphasis on WNT-relevant gene mutations (e.g., APC, CTNNB1, RNF43, AXIN1, AXIN2). Clinical variables such as age, gender, tumor location, stage, microsatellite instability (MSI) status, and treatment regimen (e.g., FOLFOX) were included. Genomic annotations and mutation profiles were preprocessed into standardized, tab-delimited formats with unified sample IDs. Metadata were harmonized using established ontologies (e.g., OncoTree, Disease Ontology) to ensure interoperability. Data validation included cross-referencing gene mutation calls, consistency checks, and enrichment annotations for WNT-associated genes.</p>
</sec>
<sec id="sec11">
<title>Natural language query processing and case subsetting</title>
<p>Users interact with the platform via plain English queries that are interpreted by an LLM (LLaMA 3) and translated into structured data operations. AI-HOPE-WNT allows for flexible cohort definitions, enabling stratification by mutation status, clinical features, treatment exposure, or demographic characteristics. For example, users can query &#x201C;Compare survival between EOCRC patients with APC mutations vs. wild-type in FOLFOX-treated tumors&#x201D; or &#x201C;Identify co-occurrence between AXIN2 and RNF43 in rectal tumors among Hispanic/Latino patients.&#x201D; The system prompts clarifications when inputs are ambiguous, enhancing transparency and preventing spurious analyses.</p>
</sec>
<sec id="sec12">
<title>Statistical and bioinformatics analysis</title>
<p>Analyses are conducted via Python-based pipelines integrated into the backend. For categorical variables, the system computes frequency distributions, chi-square or Fisher&#x2019;s exact tests, and odds ratios with 95% confidence intervals. Time-to-event data are analyzed using Kaplan&#x2013;Meier survival estimation and log-rank tests; Cox proportional hazards regression is applied for multivariate analyses. WNT-focused genes were prioritized for mutation enrichment, co-mutation, and prognostic modeling. The platform supports subgroup exploration by age (&#x003C;50 vs. &#x2265;50), ethnicity (Hispanic/Latino vs. non-Hispanic White), and tumor location (colon vs. rectal).</p>
</sec>
<sec id="sec13">
<title>System engineering and validation</title>
<p>AI-HOPE-WNT integrates a retrieval-augmented generation (RAG) engine that references a structured biomedical knowledge base to support contextual accuracy and limit hallucinations. Structured prompting ensures adherence to bioinformatics conventions and enables reproducibility across analytical outputs. To validate platform performance, we replicated key findings from our previously published studies (<xref ref-type="bibr" rid="ref26">Song et al., 2023</xref>; <xref ref-type="bibr" rid="ref35">Youssef et al., 2025</xref>; <xref ref-type="bibr" rid="ref10">Cerami et al., 2012</xref>), including RNF43 and AXIN2 mutation differences in EOCRC H/L and survival trends associated with WNT pathway alterations.</p>
</sec>
<sec id="sec14">
<title>Baseline comparison and performance evaluation</title>
<p>To benchmark the performance of AI-HOPE-WNT, we conducted a task-based comparison with two widely used platforms&#x2014;cBioPortal and UCSC Xena&#x2014;which served as baseline tools. Performance was evaluated across three core dimensions: (1) execution time, measured from query input to analysis output; (2) workflow complexity, defined by the number of steps or interface interactions required to complete a query; and (3) subgroup analysis flexibility, assessed by the ability to stratify cohorts across multiple demographic and clinical variables (e.g., age, ethnicity, treatment, mutation status). For example, a survival analysis stratified by APC mutation status and FOLFOX treatment in early-onset Hispanic/Latino patients required only a single query in AI-HOPE-WNT, compared to 6&#x2013;8 manual steps in cBioPortal and Xena. Quantitatively, AI-HOPE-WNT reduced average task completion time by 72% and enabled nested subgroup comparisons that were not natively supported in baseline tools. These results underscore the platform&#x2019;s superior efficiency, usability, and analytic scope&#x2014;particularly in real-time, natural language-driven settings focused on pathway-specific precision oncology.</p>
</sec>
<sec id="sec15">
<title>Visualization and output</title>
<p>Post-analysis, the platform generates structured reports including summary statistics, mutation frequency tables, survival plots, and forest plots. Narrative interpretations are auto-generated, linking statistical findings to literature-derived insights. Visualizations were rendered using Matplotlib and Plotly within the backend, ensuring high-resolution graphics suitable for scientific reporting.</p>
</sec>
</sec>
<sec sec-type="results" id="sec16">
<title>Results</title>
<sec id="sec17">
<title>AI-HOPE-WNT enables real-time clinical-genomic integration and natural language query execution</title>
<p>AI-HOPE-WNT was developed to transform natural language prompts into automated clinical-genomic analyses, allowing real-time exploration of WNT signaling dysregulation in CRC. The system integrates structured datasets with natural language queries, enabling users to dynamically stratify patient cohorts based on tumor location, age, sex, mutation status, microsatellite instability (MSI), and treatment exposure. In response to these queries, the platform executes statistical procedures such as Kaplan&#x2013;Meier survival analysis, odds ratio testing, and mutation frequency comparisons, and presents the results through high-resolution visualizations and narrative summaries. This functionality allows non-coding users&#x2014;including clinicians and translational researchers&#x2014;to interactively generate and test hypotheses in an intuitive and reproducible manner. The results presented here demonstrate AI-HOPE-WNT&#x2019;s capacity to both replicate previously published findings and uncover novel associations across EOCRC populations.</p>
</sec>
<sec id="sec18">
<title>Recapitulation of known WNT pathway alterations and survival associations</title>
<p>To validate the analytical robustness of the platform, AI-HOPE-WNT was applied to replicate previously reported associations between WNT pathway mutations and clinical outcomes in EOCRC patients. Using survival modeling, the system reproduced findings from a published CRC WNT study (<xref ref-type="bibr" rid="ref21">Monge et al., 2024</xref>), comparing outcomes among EOCRC patients with and without WNT pathway mutations. In Hispanic/Latino (H/L) patients, WNT-altered tumors were associated with significantly improved survival (<italic>p</italic> =&#x202F;0.0167), and a similar trend was observed in non-Hispanic White (NHW) patients, where survival differences were even more pronounced (<italic>p</italic> =&#x202F;0.0007) (<xref ref-type="fig" rid="fig2">Figure 2</xref>). These findings confirm prior evidence that WNT pathway activation, in certain molecular and demographic contexts, may have prognostic relevance in EOCRC.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>AI-HOPE-WNT recapitulation of survival outcomes in early-onset colorectal cancer (EOCRC) patients with and without WNT pathway alterations. This figure highlights AI-HOPE-WNT&#x2019;s capability to reproduce key findings from prior studies by analyzing survival outcomes in EOCRC patients stratified by WNT pathway alteration status and ancestry group. <bold>(a)</bold> The platform defines two cohorts among EOCRC Hispanic/Latino (H/L) patients: a case cohort with WNT pathway alterations (<italic>n</italic>&#x202F;=&#x202F;125; 2.3%) and a control cohort without WNT alterations (<italic>n</italic>&#x202F;=&#x202F;28; 0.5%). Pie charts visualize the distribution of selected samples relative to the entire dataset, emphasizing the rarity of unaltered WNT pathway cases in this subgroup. <bold>(b)</bold> Kaplan&#x2013;Meier survival analysis comparing these two H/L cohorts reveals significantly improved overall survival in the WNT-altered group (<italic>p</italic>&#x202F;=&#x202F;0.0167), indicating a potential protective role for WNT pathway mutations in this demographic. <bold>(c)</bold> Similarly, two cohorts were created for EOCRC non-Hispanic White (NHW) patients: those with WNT pathway alterations (<italic>n</italic>&#x202F;=&#x202F;894; 16.1%) and those without (<italic>n</italic>&#x202F;=&#x202F;223; 4.0%). The sample distributions are visualized via pie charts, highlighting a larger proportion of NHW patients in both WNT-altered and unaltered groups compared to the H/L subgroup. <bold>(d)</bold> Survival analysis for NHW patients shows a highly significant difference in outcomes (<italic>p</italic>&#x202F;=&#x202F;0.0007), with WNT-altered individuals demonstrating superior survival.</p>
</caption>
<graphic xlink:href="frai-08-1624797-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panels (a) and (c) feature pie charts depicting sample distributions. Panel (a) shows 97.7% others and 2.3% selected; panel (c) shows 83.9% others and 16.1% selected. Panels (b) and (d) illustrate Kaplan-Meier survival curves for case and control groups. Panel (b) shows a p-value of 0.0167, while panel (d) shows a p-value of 0.0007, with separate curves for case (blue) and control (orange) groups over 100 months.</alt-text>
</graphic>
</fig>
<p>Additionally, AI-HOPE-WNT reproduced previously reported trends in ancestry-specific mutation enrichment. Odds ratio testing showed that RNF43 mutations were more prevalent in H/L patients compared to NHW, with an odds ratio of 1.31 (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S1</xref>). Although the platform&#x2019;s dataset included a smaller number of H/L samples than the original study, the observed enrichment supports the reproducibility and ancestry-awareness of the platform&#x2019;s analytical workflow. Together, these validations highlight the platform&#x2019;s capability to replicate established WNT pathway associations through fully automated, natural language&#x2013;driven analysis.</p>
</sec>
<sec id="sec19">
<title>Impact of APC mutations on survival in FOLFOX-treated EOCRC</title>
<p>Exploratory analysis using AI-HOPE-WNT revealed a significant survival advantage among EOCRC patients treated with FOLFOX who harbored mutations in the APC gene. In patients under the age of 50, APC mutations were associated with significantly improved survival compared to wild-type cases (<italic>p</italic> =&#x202F;0.0027) (<xref ref-type="fig" rid="fig3">Figure 3</xref>). These findings suggest that APC mutation status may influence treatment response to FOLFOX in younger CRC patients and highlight the potential utility of pathway-specific AI agents for evaluating molecular markers within therapeutic contexts.</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>AI-HOPE-WNT analysis of early-onset colorectal cancer (EOCRC) patients treated with FOLFOX stratified by APC mutation status. This figure presents the results of a natural language query executed via AI-HOPE-WNT, investigating the impact of APC mutation status on survival among EOCRC patients treated with combination chemotherapy (FLUOROURACIL, LEUCOVORIN, and OXALIPLATIN). <bold>(a)</bold> The user-defined cohort includes CRC patients under the age of 50 who received FOLFOX-based treatment. A histogram illustrates the age distribution within the full dataset (mean: 57.92&#x202F;years), providing context for the selection of early-onset cases. <bold>(b)</bold> Two cohorts are defined: one with APC mutations (<italic>n</italic>&#x202F;=&#x202F;950; 17.1%) and one without APC mutations (<italic>n</italic>&#x202F;=&#x202F;304; 5.5%). Corresponding pie charts display the proportional representation of each cohort relative to the total dataset. <bold>(c)</bold> Kaplan&#x2013;Meier survival analysis reveals a significant difference in survival outcomes between the APC-mutated (case) and APC wild-type (control) groups (<italic>p</italic>&#x202F;=&#x202F;0.0027).</p>
</caption>
<graphic xlink:href="frai-08-1624797-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">(a) A histogram with a density curve shows the distribution of values, highlighting central clustering. Mean is 57.92, median is 57.75. (b) A pie chart illustrating sample distribution: 17.1 percent selected and 82.9 percent others. Another pie chart shows 5.5 percent selected, 94.5 percent others. (c) Kaplan-Meier survival curve comparing case and control groups with a p-value of 0.0027, indicating a significant difference over time.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec20">
<title>Stage-specific outcomes in RNF43-mutated CRC</title>
<p>The platform was also used to explore survival outcomes based on tumor stage among RNF43-mutated CRC patients. AI-HOPE-WNT identified a significant survival disadvantage in patients with Stage IV (metastatic) tumors compared to those with Stage I&#x2013;III (non-metastatic) disease (<italic>p</italic> &#x003C;&#x202F;0.0001) (<xref ref-type="fig" rid="fig4">Figure 4</xref>). This result underscores the prognostic importance of tumor stage in RNF43-mutant CRC and demonstrates how AI-HOPE-WNT can uncover nuanced, mutation-specific insights through stratified cohort comparisons.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>AI-HOPE-WNT analysis of RNF43-mutant colorectal cancer (CRC) patients by tumor stage (primary vs. metastatic). This figure demonstrates how AI-HOPE-WNT enables survival analysis of CRC patients harboring RNF43 mutations, stratified by tumor stage to compare outcomes between primary (Stage I&#x2013;III) and metastatic (Stage IV) disease. <bold>(a)</bold> The initial data exploration phase uses bar plots to summarize patient distribution by tumor stage among RNF43-mutated CRC cases. The top chart shows absolute counts (Stage I&#x2013;III: <italic>n</italic>&#x202F;=&#x202F;3,171; Stage IV: <italic>n</italic>&#x202F;=&#x202F;2,372), while the bottom chart displays proportional representation (Stage I&#x2013;III: 51.7%; Stage IV: 38.7%), confirming sufficient subgroup sample sizes for comparative analysis. <bold>(b)</bold> Based on the defined query, two pie charts illustrate the relative sizes of the selected case (Stage I&#x2013;III, <italic>n</italic>&#x202F;=&#x202F;452) and control (Stage IV, <italic>n</italic>&#x202F;=&#x202F;111) cohorts against the background dataset. These subsets correspond to 7.4 and 1.8% of the total patient population, respectively, indicating lower prevalence of RNF43 mutations in advanced-stage CRC. <bold>(c)</bold> Kaplan&#x2013;Meier survival analysis is then conducted to evaluate outcome differences between the two groups. The upper survival plot shows significantly improved survival in the Stage I&#x2013;III (primary tumor) group relative to the Stage IV (metastatic) group (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001), with visibly distinct survival curves and non-overlapping confidence intervals. The bottom survival plot is a placeholder indicating no data for a corresponding comparison, potentially due to an absence of relevant events or an error in query execution.</p>
</caption>
<graphic xlink:href="frai-08-1624797-g004.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel (a) shows bar charts of counts and percentages for values, with Stage 1-3 having higher values than Stage 4. Panel (b) displays pie charts of sample distribution, with a large majority classified as "Others." Panel (c) features Kaplan-Meier survival curves, showing a distinct survival difference between case and control groups, with a significant p-value of 0.0000.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec21">
<title>Tumor location and co-mutation patterns between AXIN1 and APC</title>
<p>Using natural language queries, AI-HOPE-WNT investigated co-mutation patterns between AXIN1 and APC by tumor location. Odds ratio testing revealed differential enrichment of APC co-mutations in colon versus rectal tumors. However, Kaplan&#x2013;Meier survival analysis showed no statistically significant survival differences between these anatomical subgroups (<italic>p</italic> =&#x202F;0.2216) (<xref ref-type="fig" rid="fig5">Figure 5</xref>). These results suggest that while co-mutation patterns may vary by location, their prognostic impact may be limited&#x2014;or require larger datasets for confirmation&#x2014;highlighting the platform&#x2019;s potential for guiding further inquiry.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>AI-HOPE-WNT analysis of AXIN1-mutant colorectal cancer (CRC) by tumor location: colon vs. rectal adenocarcinoma. This figure illustrates the use of AI-HOPE-WNT to analyze CRC patients with AXIN1 mutations, comparing colon versus rectal adenocarcinomas. The analysis includes an odds ratio test contextualized by APC mutation status and a Kaplan&#x2013;Meier survival analysis. <bold>(a)</bold> The initial panel shows distribution plots of tumor types in the dataset. Colon adenocarcinoma (X0) is the most prevalent subtype (<italic>n</italic>&#x202F;=&#x202F;3,790), followed by rectal adenocarcinoma (X1, <italic>n</italic>&#x202F;=&#x202F;1,476). The top bar chart shows the counts of each tumor subtype, while the bottom plot presents their relative proportions (60.8 and 23.7%, respectively). <bold>(b)</bold> Pie charts summarize the cohort refinement process based on the specified query: selecting CRC patients with AXIN1 mutations and categorizing them by tumor type. The upper pie chart shows the case group (colon adenocarcinoma with AXIN1 mutation, <italic>n</italic>&#x202F;=&#x202F;146) as 2.4% of the dataset, while the control group (rectal adenocarcinoma with AXIN1 mutation, <italic>n</italic>&#x202F;=&#x202F;22) makes up only 0.4%, highlighting the rarity of co-mutations in the control group. <bold>(c)</bold> A 2&#x00D7;2 odds ratio analysis is performed using APC mutation status as contextual stratification. The stacked bar plot visualizes the outcome categories (In_Context vs. Out_of_Context) across case and control groups. This analysis allows the user to explore whether APC mutations are differentially enriched among colon versus rectal tumors in the presence of AXIN1 mutations. <bold>(d)</bold> Kaplan&#x2013;Meier survival curves compare survival outcomes between the two tumor locations in the AXIN1-mutated population. While the curves diverge, suggesting some difference in survival probability, the <italic>p</italic>-value (0.2216) indicates no statistically significant difference under the current sample conditions.</p>
</caption>
<graphic xlink:href="frai-08-1624797-g005.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">(a) Two bar plots showing the distribution of cancer types by count and percentage. X0 has the highest count and percentage. (b) Two pie charts displaying the distribution of selected samples, with 97.6% and 99.6% labeled as others. (c) Stacked bar plot illustrating odds ratio analysis for case and control groups, divided by context. (d) Kaplan-Meier survival curve comparing survival probabilities over time between case and control groups, with a p-value of 0.2216.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec22">
<title>Sex-based differences in survival among AXIN2-mutated patients stratified by MSI</title>
<p>Sex-based survival differences were evaluated among AXIN2-mutated patients, stratified by MSI status. A trend toward worse progression-free survival was observed in male patients relative to females, though the difference did not reach statistical significance (<italic>p</italic> =&#x202F;0.1274). Nevertheless, odds ratio analysis revealed MSI-stable enrichment in both male and female subgroups (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S2</xref>), indicating potential interactions between gender, microsatellite status, and WNT signaling. These findings illustrate how AI-HOPE-WNT can facilitate exploration of under-investigated biological interactions using clinical-genomic data.</p>
</sec>
<sec id="sec23">
<title>Age-stratified analysis of APC mutation prevalence and prognosis</title>
<p>AI-HOPE-WNT was used to assess the relationship between APC mutation prevalence and age in primary CRC tumors. Among 3,396 APC-mutant and 1,252 wild-type cases, odds ratio testing showed that APC mutations were significantly more prevalent in EOCRC patients (&#x003C;50&#x202F;years). Further, Kaplan&#x2013;Meier survival analysis demonstrated significantly improved outcomes in APC-mutated tumors (<italic>p</italic> =&#x202F;0.00001) (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S3</xref>). This supports the prognostic relevance of APC mutations in younger CRC populations and illustrates how AI-HOPE-WNT can stratify patients for biomarker discovery.</p>
</sec>
<sec id="sec24">
<title>Summary of analytical capabilities and insights</title>
<p>Collectively, these results showcase the analytical range and depth of AI-HOPE-WNT. The platform successfully replicated prior WNT-related findings while generating new hypotheses linking gene alterations to survival outcomes across treatment types, tumor stages, demographics, and molecular subgroups. By enabling real-time, natural language&#x2013;driven analysis of harmonized clinical-genomic data, AI-HOPE-WNT offers a novel, scalable approach to translational discovery in colorectal cancer. Its ability to handle complex stratification and return visual and statistical outputs makes it a powerful tool for precision oncology research, education, and clinical hypothesis testing.</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec25">
<title>Discussion</title>
<p>AI-HOPE-WNT introduces a paradigm shift in pathway-specific precision oncology by enabling natural language&#x2013;driven exploration of WNT signaling dysregulation in CRC. Unlike conventional platforms that require manual filtering, pre-defined workflows, or scripting knowledge, AI-HOPE-WNT translates user prompts into automated, rigorous analyses encompassing survival modeling, odds ratio testing, and mutation frequency comparison&#x2014;streamlining hypothesis generation and reducing technical barriers. This system offers a flexible and scalable framework to interrogate clinical-genomic relationships, particularly within the context of EOCRC and underserved populations.</p>
<p>A defining strength of AI-HOPE-WNT lies in its ability to dynamically stratify CRC patient cohorts by WNT gene mutation status (e.g., APC, AXIN1/2, RNF43), tumor location, age group, treatment exposure (e.g., FOLFOX), and molecular phenotype (e.g., MSI). For example, in EOCRC patients treated with FOLFOX, AI-HOPE-WNT detected improved survival among those harboring APC mutations&#x2014;supporting the prognostic relevance of this canonical WNT gene in treatment contexts. Similarly, by comparing RNF43-mutant patients across tumor stages, the platform revealed a significant survival disadvantage in metastatic cases, a finding that would otherwise require multi-step analyses in standard bioinformatics tools.</p>
<p>Importantly, the conversational design of AI-HOPE-WNT empowers researchers, clinicians, and students to interact directly with large-scale genomics data using plain English, eliminating the need for programming expertise. Through this interface, users were able to uncover gender-specific survival trends in AXIN2-mutated cases under microsatellite stability conditions and explore co-mutation enrichment by tumor site. These observations highlight the utility of AI-HOPE-WNT for dissecting complex molecular interactions and demographic disparities that have historically been underexplored due to analytic barriers.</p>
<p>The platform&#x2019;s validation phase confirmed its analytical reliability by reproducing prior findings from Hispanic/Latino CRC disparity studies, specifically the enrichment of RNF43 and AXIN2 mutations in EOCRC and the favorable survival associated with WNT pathway alterations. Exploratory results expanded on these findings, including the association between APC mutations and earlier age of onset&#x2014;a hypothesis supported by both prevalence data and Kaplan&#x2013;Meier survival analysis. These insights reinforce the potential of AI-HOPE-WNT to inform biomarker discovery, therapeutic stratification, and population-specific interventions.</p>
<p>From a systems engineering standpoint, AI-HOPE-WNT leverages a modular LLM framework coupled with retrieval-augmented generation (RAG) and biomedical ontologies to ensure accurate, reproducible, and context-aware outputs. This design significantly reduces hallucinations while preserving statistical integrity, enabling robust and interpretable bioinformatics workflows. Benchmarking showed that AI-HOPE-WNT outperforms traditional platforms in execution time and flexibility, particularly for nested subgroup comparisons and multi-parameter stratifications.</p>
<p>Recent advances in AI-based biomedical research have demonstrated the utility of machine learning for feature extraction, classification, and diagnostic insight across a range of biological systems. For instance a previous effort (<xref ref-type="bibr" rid="ref11">Chen et al., 2025</xref>) developed a machine learning framework (CLPr_in_ML) to classify cleft lip and palate abnormalities using CBCT imaging and feature reconstruction techniques, achieving high performance with various operator-based features. Similarly, the Golgi_DF framework (<xref ref-type="bibr" rid="ref2">Bao et al., 2023</xref>) introduced a deep forest algorithm for the classification of Golgi proteins, incorporating synthetic oversampling and feature reduction to improve model accuracy and biological interpretability. These efforts align with the goals of AI-HOPE-WNT in demonstrating how AI systems can enhance biomedical analysis through structured feature interpretation and machine learning&#x2013;driven discovery. While their application domains differ&#x2014;structural imaging and proteomics, respectively&#x2014;these models underscore the broader relevance of AI in supporting biologically meaningful stratification, which parallels our objective of automating clinical-genomic interrogation within the context of WNT pathway dysregulation in colorectal cancer.</p>
<p>The development of AI-HOPE-WNT builds upon our previous work establishing a suite of AI-driven agents designed to facilitate clinical-genomic integration in precision oncology. Our initial platform, AI-HOPE (<xref ref-type="bibr" rid="ref32">Yang and Velazquez-Villarreal, 2025</xref>), introduced a general-purpose conversational agent capable of harmonizing and analyzing cancer genomics and clinical data using natural language inputs. This foundational framework established the modular architecture&#x2014;combining LLMs, natural language-to-code translation, and backend statistical engines&#x2014;that underpins all subsequent AI-HOPE agents. Expanding on this, we developed AI-HOPE-TGFbeta (<xref ref-type="bibr" rid="ref33">Yang et al., 2025a</xref>), the first pathway-specific conversational agent focused on interrogating TGF-<italic>&#x03B2;</italic> alterations in CRC, demonstrating the platform&#x2019;s ability to replicate known findings and stratify patients across clinical variables. Most recently, AI-HOPE-PI3K (<xref ref-type="bibr" rid="ref34">Yang et al., 2025b</xref>) extended this approach to the PI3K signaling pathway, highlighting the prognostic relevance of PI3K alterations and validating the agent&#x2019;s capacity for mutation-driven survival modeling. AI-HOPE-WNT advances this line of work by targeting the WNT pathway&#x2014;one of the most frequently altered and clinically relevant signaling axes in CRC&#x2014;further refining pathway-specific stratification and enabling exploratory hypothesis testing across age, ethnicity, tumor location, and treatment response. Collectively, these projects represent an evolving ecosystem of AI-HOPE agents, each purpose-built to support scalable, accessible, and reproducible analysis of key molecular pathways driving cancer disparities and outcomes.</p>
<p>As part of a broader initiative to develop a family of specialized AI agents, AI-HOPE-WNT was developed with a unique architecture specifically tailored to the complexity of the WNT signaling pathway in CRC. While sharing a common conceptual framework, this agent features distinct structural components compared to previously published models&#x2014;AI-HOPE-TGFbeta (<xref ref-type="bibr" rid="ref33">Yang et al., 2025a</xref>) and AI-HOPE-PI3K (<xref ref-type="bibr" rid="ref34">Yang et al., 2025b</xref>)&#x2014;with each AI agent intentionally designed as a modular, standalone system optimized for interrogating a specific molecular pathway. This pathway-specific approach is based on the rationale that key oncogenic pathways such as WNT, TGF-<italic>&#x03B2;</italic>, and PI3K exhibit unique mutational patterns, prognostic relevance, and population-specific implications, particularly in early-onset CRC. Developing specialized agents allows for more precise validation, biologically focused natural language querying, and pathway-specific hypothesis generation&#x2014;capabilities that would be challenging to achieve within a single, general-purpose model. This modular design also supports independent benchmarking and iterative refinement, thereby enhancing transparency and reproducibility. Another example of a specialized agent is AI-HOPE (<xref ref-type="bibr" rid="ref32">Yang and Velazquez-Villarreal, 2025</xref>), which was developed to support integrative clinical and genomic data analysis across broader cancer research settings. Looking forward, the research team envisions integrating these agents into a collaborative and interoperable framework. To enable this, they are actively exploring Agent-to-Agent (A2A) communication protocols and Multi-Agent Collaboration Protocols (MCP), which would allow coordination among agents and facilitate the resolution of complex, multi-pathway queries. This direction supports the long-term goal of building an intelligent, scalable AI ecosystem for precision oncology&#x2014;capable of modeling the molecular heterogeneity of cancer across diverse populations and clinical contexts.</p>
<p>In response to the growing demand for accessible AI tools in precision oncology, the development team acknowledges the importance of creating a web-based interface to broaden the usability of the AI-HOPE-WNT platform beyond users with programming expertise. While the current version of AI-HOPE-WNT is publicly available on GitHub with full source code and documentation, efforts are underway to develop a web-based application that offers an intuitive and interactive user experience. This planned interface would enable clinicians, researchers, and trainees to submit natural language queries, perform stratified cohort analyses, and generate visual reports directly through a browser-based environment. By reducing technical barriers, such a platform would help democratize access to clinical-genomic integration tools, support educational and training initiatives, and enable real-time hypothesis generation in translational cancer research. This direction is viewed as a critical next step toward expanding the reach and impact of the AI-HOPE-WNT platform across the precision oncology community.</p>
<p>Nonetheless, future enhancements are warranted. Expanding AI-HOPE-WNT to incorporate multi-omics layers&#x2014;such as transcriptomic, proteomic, and spatial data&#x2014;will broaden its analytic capacity. Integration with federated learning frameworks and secure data environments could also facilitate deployment in clinical settings where patient privacy and continual data updates are essential. Comparative benchmarking against emerging AI-driven platforms like CellAgent and AutoBA will be critical to assess generalizability and performance across broader cancer domains.</p>
</sec>
<sec sec-type="conclusions" id="sec26">
<title>Conclusion</title>
<p>AI-HOPE-WNT represents a significant advancement in precision oncology by enabling real-time, pathway-specific analysis of CRC through a natural language interface. By integrating genomic, clinical, and demographic data, the platform empowers users to explore WNT signaling alterations and their prognostic implications across diverse patient subgroups. Its ability to validate prior findings, generate novel hypotheses, and perform scalable, reproducible analyses without coding expertise underscores its value as both a research and translational tool. With continued development, AI-HOPE-WNT holds promise for accelerating biomarker discovery, informing equitable treatment strategies, and supporting next-generation, AI-driven cancer care.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec27">
<title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: the source data used in this study were publicly available before the initiation of the study and can be accessed through cBioPortal for cancer genomics at: <ext-link xlink:href="https://www.cbioportal.org/" ext-link-type="uri">https://www.cbioportal.org/</ext-link>.</p>
</sec>
<sec sec-type="ethics-statement" id="sec28">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Memorial Sloan Kettering Cancer Center (MSK) Institutional Review Board. The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation was not required from the participants or the participants&#x2019; legal guardians/next of kin in accordance with the national legislation and institutional requirements.</p>
</sec>
<sec sec-type="author-contributions" id="sec29">
<title>Author contributions</title>
<p>E-WY: Investigation, Methodology, Conceptualization, Writing &#x2013; review &#x0026; editing, Software, Visualization, Writing &#x2013; original draft. BW: Validation, Formal analysis, Visualization, Data curation, Writing &#x2013; original draft, Investigation, Writing &#x2013; review &#x0026; editing. EV-V: Visualization, Writing &#x2013; original draft, Data curation, Formal analysis, Software, Methodology, Funding acquisition, Conceptualization, Resources, Supervision, Project administration, Investigation, Validation, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="funding-information" id="sec30">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This research was funded by the Department of Integrative Translational Sciences at City of Hope, the City of Hope Cancer Control and Population Sciences Program, National Cancer Institute (NCI), National Institute of Health (NIH), award number NIH/NCI P30-CA033572; NIH, NCI, Cancer Moonshot project, PE-CGS: Optimizing Engagement of Hispanic Colorectal Cancer Patients in Cancer Genomic Characterization Studies, award number NIH/NCI U2C-CA252971; and NIH, NCI, U54 University of California Riverside (UCR) and City of Hope Comprehensive Cancer Center (COH-CCC) partnership, Drug Development and Capacity Building, award number NIH/NCI U54-CA285116.</p>
</sec>
<sec sec-type="COI-statement" id="sec31">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec32">
<title>Generative AI statement</title>
<p>The author(s) declare that no Gen AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="sec33">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec34">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/frai.2025.1624797/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/frai.2025.1624797/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Antelo</surname> <given-names>M.</given-names></name> <name><surname>Balaguer</surname> <given-names>F.</given-names></name> <name><surname>Shia</surname> <given-names>J.</given-names></name> <name><surname>Shen</surname> <given-names>Y.</given-names></name> <name><surname>Hur</surname> <given-names>K.</given-names></name> <name><surname>Moreira</surname> <given-names>L.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>A high degree of LINE-1 hypomethylation is a unique feature of early-onset colorectal cancer</article-title>. <source>PLoS One</source> <volume>7</volume>:<fpage>e45357</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0045357</pub-id>, PMID: <pub-id pub-id-type="pmid">23049789</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bao</surname> <given-names>W.</given-names></name> <name><surname>Gu</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>B.</given-names></name> <name><surname>Yu</surname> <given-names>H.</given-names></name></person-group> (<year>2023</year>). <article-title>Golgi_DF: Golgi proteins classification with deep forest</article-title>. <source>Front. Neurosci.</source> <volume>17</volume>:<fpage>1197824</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fnins.2023.1197824</pub-id>, PMID: <pub-id pub-id-type="pmid">37250391</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bhalla</surname> <given-names>S.</given-names></name> <name><surname>Lagan&#x00E0;</surname> <given-names>A.</given-names></name></person-group> (<year>2022</year>). <article-title>Artificial intelligence for precision oncology</article-title>. <source>Adv. Exp. Med. Biol.</source> <volume>1361</volume>, <fpage>249</fpage>&#x2013;<lpage>268</lpage>. doi: <pub-id pub-id-type="doi">10.1007/978-3-030-91836-1_14</pub-id>, PMID: <pub-id pub-id-type="pmid">35230693</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bhinder</surname> <given-names>B.</given-names></name> <name><surname>Gilvary</surname> <given-names>C.</given-names></name> <name><surname>Madhukar</surname> <given-names>N. S.</given-names></name> <name><surname>Elemento</surname> <given-names>O.</given-names></name></person-group> (<year>2021</year>). <article-title>Artificial intelligence in Cancer research and precision medicine</article-title>. <source>Cancer Discov.</source> <volume>11</volume>, <fpage>900</fpage>&#x2013;<lpage>915</lpage>. doi: <pub-id pub-id-type="doi">10.1158/2159-8290.CD-21-0090</pub-id>, PMID: <pub-id pub-id-type="pmid">33811123</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bugter</surname> <given-names>J. M.</given-names></name> <name><surname>Fenderico</surname> <given-names>N.</given-names></name> <name><surname>Maurice</surname> <given-names>M. M.</given-names></name></person-group> (<year>2021</year>). <article-title>Mutations and mechanisms of WNT pathway tumour suppressors in cancer</article-title>. <source>Nat. Rev. Cancer</source> <volume>21</volume>, <fpage>5</fpage>&#x2013;<lpage>21</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41568-020-00307-z</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><collab id="coll1">Cancer Genome Atlas Network</collab></person-group> (<year>2012</year>). <article-title>Comprehensive molecular characterization of human colon and rectal cancer</article-title>. <source>Nature</source> <volume>487</volume>, <fpage>330</fpage>&#x2013;<lpage>337</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nature11252</pub-id>, PMID: <pub-id pub-id-type="pmid">22810696</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carl&#x00E0;</surname> <given-names>M. M.</given-names></name> <name><surname>Gambini</surname> <given-names>G.</given-names></name> <name><surname>Giannuzzi</surname> <given-names>F.</given-names></name> <name><surname>Boselli</surname> <given-names>F.</given-names></name> <name><surname>De Luca</surname> <given-names>L.</given-names></name> <name><surname>Rizzo</surname> <given-names>S.</given-names></name></person-group> (<year>2025</year>). <article-title>Testing the reliability of ChatGPT assistance for surgical choices in challenging Glaucoma cases</article-title>. <source>J Pers Med.</source> <volume>15</volume>:<fpage>97</fpage>. doi: <pub-id pub-id-type="doi">10.3390/jpm15030097</pub-id>, PMID: <pub-id pub-id-type="pmid">40137413</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carranza</surname> <given-names>F. G.</given-names></name> <name><surname>Diaz</surname> <given-names>F. C.</given-names></name> <name><surname>Ninova</surname> <given-names>M.</given-names></name> <name><surname>Velazquez-Villarreal</surname> <given-names>E.</given-names></name></person-group> (<year>2024</year>). <article-title>Current state and future prospects of spatial biology in colorectal cancer</article-title>. <source>Front. Oncol.</source> <volume>14</volume>:<fpage>1513821</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fonc.2024.1513821</pub-id>, PMID: <pub-id pub-id-type="pmid">39711954</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carranza</surname> <given-names>F. G.</given-names></name> <name><surname>Waldrup</surname> <given-names>B.</given-names></name> <name><surname>Jin</surname> <given-names>Y.</given-names></name> <name><surname>Amzaleg</surname> <given-names>Y.</given-names></name> <name><surname>Postel</surname> <given-names>M.</given-names></name> <name><surname>Craig</surname> <given-names>D. W.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Assessment of MYC gene and WNT pathway alterations in early-onset colorectal cancer among Hispanic/Latino patients using integrated multi-omics approaches</article-title>. <source>medRxiv</source> [Preprint], <fpage>2024.12.05.24318588</fpage>. doi: <pub-id pub-id-type="doi">10.1101/2024.12.05.24318588</pub-id>, PMID: <pub-id pub-id-type="pmid">40034762</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cerami</surname> <given-names>E.</given-names></name> <name><surname>Gao</surname> <given-names>J.</given-names></name> <name><surname>Dogrusoz</surname> <given-names>U.</given-names></name> <name><surname>Gross</surname> <given-names>B. E.</given-names></name> <name><surname>Sumer</surname> <given-names>S. O.</given-names></name> <name><surname>Aksoy</surname> <given-names>B. A.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>The cBio cancer genomics portal: an open platform for exploring multidimensional cancer genomics data</article-title>. <source>Cancer Discov.</source> <volume>2</volume>, <fpage>401</fpage>&#x2013;<lpage>404</lpage>. doi: <pub-id pub-id-type="doi">10.1158/2159-8290.CD-12-0095</pub-id> <comment>Erratum in: Cancer Discov. 2012 Oct;2(10):960.</comment>, PMID: <pub-id pub-id-type="pmid">22588877</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>B.</given-names></name> <name><surname>Li</surname> <given-names>N.</given-names></name> <name><surname>Bao</surname> <given-names>W.</given-names></name></person-group> (<year>2025</year>). <article-title>CLPr_in_ML: cleft lip and palate reconstructed features with machine learning</article-title>. <source>Curr. Bioinforma.</source> <volume>20</volume>:<fpage>e15748936330499</fpage>. doi: <pub-id pub-id-type="doi">10.2174/0115748936330499240909082529</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>Z. H.</given-names></name> <name><surname>Lin</surname> <given-names>L.</given-names></name> <name><surname>Wu</surname> <given-names>C. F.</given-names></name> <name><surname>Li</surname> <given-names>C. F.</given-names></name> <name><surname>Xu</surname> <given-names>R. H.</given-names></name> <name><surname>Sun</surname> <given-names>Y.</given-names></name></person-group> (<year>2021</year>). <article-title>Artificial intelligence for assisting cancer diagnosis and treatment in the era of precision medicine</article-title>. <source>Cancer Commun (Lond)</source> <volume>41</volume>, <fpage>1100</fpage>&#x2013;<lpage>1115</lpage>. doi: <pub-id pub-id-type="doi">10.1002/cac2.12215</pub-id>, PMID: <pub-id pub-id-type="pmid">34613667</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chua</surname> <given-names>I. S.</given-names></name> <name><surname>Gaziel-Yablowitz</surname> <given-names>M.</given-names></name> <name><surname>Korach</surname> <given-names>Z. T.</given-names></name> <name><surname>Kehl</surname> <given-names>K. L.</given-names></name> <name><surname>Levitan</surname> <given-names>N. A.</given-names></name> <name><surname>Arriaga</surname> <given-names>Y. E.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Artificial intelligence in oncology: path to implementation</article-title>. <source>Cancer Med.</source> <volume>10</volume>, <fpage>4138</fpage>&#x2013;<lpage>4149</lpage>. doi: <pub-id pub-id-type="doi">10.1002/cam4.3935</pub-id>, PMID: <pub-id pub-id-type="pmid">33960708</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eralp</surname> <given-names>B.</given-names></name> <name><surname>Sefer</surname> <given-names>E.</given-names></name></person-group> (<year>2024</year>). <article-title>Reference-free inferring of transcriptomic events in cancer cells on single-cell data</article-title>. <source>BMC Cancer</source> <volume>24</volume>:<fpage>607</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12885-024-12331-5</pub-id>, PMID: <pub-id pub-id-type="pmid">38769480</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Farooqi</surname> <given-names>A. A.</given-names></name> <name><surname>de la Roche</surname> <given-names>M.</given-names></name> <name><surname>Djamgoz</surname> <given-names>M. B. A.</given-names></name> <name><surname>Siddik</surname> <given-names>Z. H.</given-names></name></person-group> (<year>2019</year>). <article-title>Overview of the oncogenic signaling pathways in colorectal cancer: mechanistic insights</article-title>. <source>Semin. Cancer Biol.</source> <volume>58</volume>, <fpage>65</fpage>&#x2013;<lpage>79</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.semcancer.2019.01.001</pub-id>, PMID: <pub-id pub-id-type="pmid">30633978</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ferrell</surname> <given-names>M.</given-names></name> <name><surname>Guven</surname> <given-names>D. C.</given-names></name> <name><surname>Gomez</surname> <given-names>C. G.</given-names></name> <name><surname>Nasrollahi</surname> <given-names>E.</given-names></name> <name><surname>Giza</surname> <given-names>R.</given-names></name> <name><surname>Cheng</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Investigating the WNT and TGF-beta pathways alterations and tumor mutant burden in young-onset colorectal cancer</article-title>. <source>Sci. Rep.</source> <volume>14</volume>:<fpage>17884</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-024-68938-y</pub-id>, PMID: <pub-id pub-id-type="pmid">39095553</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Garcia</surname> <given-names>S.</given-names></name> <name><surname>Pruitt</surname> <given-names>S. L.</given-names></name> <name><surname>Singal</surname> <given-names>A. G.</given-names></name> <name><surname>Murphy</surname> <given-names>C. C.</given-names></name></person-group> (<year>2018</year>). <article-title>Colorectal cancer incidence among Hispanics and non-Hispanic whites in the United States</article-title>. <source>Cancer Causes Control</source> <volume>29</volume>, <fpage>1039</fpage>&#x2013;<lpage>1046</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10552-018-1077-1</pub-id>, PMID: <pub-id pub-id-type="pmid">30155605</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Goldman</surname> <given-names>M. J.</given-names></name> <name><surname>Craft</surname> <given-names>B.</given-names></name> <name><surname>Hastie</surname> <given-names>M.</given-names></name> <name><surname>Repe&#x010D;ka</surname> <given-names>K.</given-names></name> <name><surname>McDade</surname> <given-names>F.</given-names></name> <name><surname>Kamath</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Visualizing and interpreting cancer genomics data via the Xena platform</article-title>. <source>Nat. Biotechnol.</source> <volume>38</volume>, <fpage>675</fpage>&#x2013;<lpage>678</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41587-020-0546-8</pub-id>, PMID: <pub-id pub-id-type="pmid">32444850</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lieu</surname> <given-names>C. H.</given-names></name> <name><surname>Golemis</surname> <given-names>E. A.</given-names></name> <name><surname>Serebriiskii</surname> <given-names>I. G.</given-names></name> <name><surname>Newberg</surname> <given-names>J.</given-names></name> <name><surname>Hemmerich</surname> <given-names>A.</given-names></name> <name><surname>Connelly</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Comprehensive genomic landscapes in early and later onset colorectal Cancer</article-title>. <source>Clin. Cancer Res.</source> <volume>25</volume>, <fpage>5852</fpage>&#x2013;<lpage>5858</lpage>. doi: <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-19-0899</pub-id>, PMID: <pub-id pub-id-type="pmid">31243121</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mauri</surname> <given-names>G.</given-names></name> <name><surname>Sartore-Bianchi</surname> <given-names>A.</given-names></name> <name><surname>Russo</surname> <given-names>A. G.</given-names></name> <name><surname>Marsoni</surname> <given-names>S.</given-names></name> <name><surname>Bardelli</surname> <given-names>A.</given-names></name> <name><surname>Siena</surname> <given-names>S.</given-names></name></person-group> (<year>2019</year>). <article-title>Early-onset colorectal cancer in young individuals</article-title>. <source>Mol. Oncol.</source> <volume>13</volume>, <fpage>109</fpage>&#x2013;<lpage>131</lpage>. doi: <pub-id pub-id-type="doi">10.1002/1878-0261.12417</pub-id>, PMID: <pub-id pub-id-type="pmid">30520562</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Monge</surname> <given-names>C.</given-names></name> <name><surname>Waldrup</surname> <given-names>B.</given-names></name> <name><surname>Carranza</surname> <given-names>F. G.</given-names></name> <name><surname>Velazquez-Villarreal</surname> <given-names>E.</given-names></name></person-group> (<year>2024</year>). <article-title>WNT and TGF-Beta pathway alterations in early-onset colorectal Cancer among Hispanic/Latino populations</article-title>. <source>Cancers (Basel)</source> <volume>16</volume>:<fpage>3903</fpage>. doi: <pub-id pub-id-type="doi">10.3390/cancers16233903</pub-id>, PMID: <pub-id pub-id-type="pmid">39682092</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Monge</surname> <given-names>C.</given-names></name> <name><surname>Waldrup</surname> <given-names>B.</given-names></name> <name><surname>Carranza</surname> <given-names>F. G.</given-names></name> <name><surname>Velazquez-Villarreal</surname> <given-names>E.</given-names></name></person-group> (<year>2025</year>). <article-title>Molecular heterogeneity in early-onset colorectal Cancer: pathway-specific insights in high-risk populations</article-title>. <source>Cancers (Basel)</source> <volume>17</volume>:<fpage>1325</fpage>. doi: <pub-id pub-id-type="doi">10.3390/cancers17081325</pub-id>, PMID: <pub-id pub-id-type="pmid">40282501</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sanchez-Vega</surname> <given-names>F.</given-names></name> <name><surname>Mina</surname> <given-names>M.</given-names></name> <name><surname>Armenia</surname> <given-names>J.</given-names></name> <name><surname>Chatila</surname> <given-names>W. K.</given-names></name> <name><surname>Luna</surname> <given-names>A.</given-names></name> <name><surname>La</surname> <given-names>K. C.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Oncogenic signaling pathways in the Cancer genome atlas</article-title>. <source>Cell</source> <volume>173</volume>, <fpage>321</fpage>&#x2013;<lpage>337.e10</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2018.03.035</pub-id>, PMID: <pub-id pub-id-type="pmid">29625050</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shimizu</surname> <given-names>H.</given-names></name> <name><surname>Nakayama</surname> <given-names>K. I.</given-names></name></person-group> (<year>2020</year>). <article-title>Artificial intelligence in oncology</article-title>. <source>Cancer Sci.</source> <volume>111</volume>, <fpage>1452</fpage>&#x2013;<lpage>1460</lpage>. doi: <pub-id pub-id-type="doi">10.1111/cas.14377</pub-id>, PMID: <pub-id pub-id-type="pmid">32133724</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sinicrope</surname> <given-names>F. A.</given-names></name></person-group> (<year>2022</year>). <article-title>Increasing incidence of early-onset colorectal Cancer</article-title>. <source>N. Engl. J. Med.</source> <volume>386</volume>, <fpage>1547</fpage>&#x2013;<lpage>1558</lpage>. doi: <pub-id pub-id-type="doi">10.1056/NEJMra2200869</pub-id>, PMID: <pub-id pub-id-type="pmid">35443109</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Song</surname> <given-names>H.</given-names></name> <name><surname>Sontz</surname> <given-names>R. A.</given-names></name> <name><surname>Vance</surname> <given-names>M. J.</given-names></name> <name><surname>Morris</surname> <given-names>J. M.</given-names></name> <name><surname>Sheriff</surname> <given-names>S.</given-names></name> <name><surname>Zhu</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>High-fat diet plus HNF1A variant promotes polyps by activating &#x03B2;-catenin in early-onset colorectal cancer</article-title>. <source>JCI Insight</source> <volume>8</volume>:<fpage>e167163</fpage>. doi: <pub-id pub-id-type="doi">10.1172/jci.insight.167163</pub-id>, PMID: <pub-id pub-id-type="pmid">37219942</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sung</surname> <given-names>H.</given-names></name> <name><surname>Ferlay</surname> <given-names>J.</given-names></name> <name><surname>Siegel</surname> <given-names>R. L.</given-names></name> <name><surname>Laversanne</surname> <given-names>M.</given-names></name> <name><surname>Soerjomataram</surname> <given-names>I.</given-names></name> <name><surname>Jemal</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Global Cancer statistics 2020: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>. <source>CA Cancer J. Clin.</source> <volume>71</volume>, <fpage>209</fpage>&#x2013;<lpage>249</lpage>. doi: <pub-id pub-id-type="doi">10.3322/caac.21660</pub-id>, PMID: <pub-id pub-id-type="pmid">33538338</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Suresh</surname> <given-names>S.</given-names></name> <name><surname>Misra</surname> <given-names>S. M.</given-names></name></person-group> (<year>2024</year>). <article-title>Large language models in pediatric education: current uses and future potential</article-title>. <source>Pediatrics</source> <volume>154</volume>:<fpage>e2023064683</fpage>. doi: <pub-id pub-id-type="doi">10.1542/peds.2023-064683</pub-id>, PMID: <pub-id pub-id-type="pmid">39108227</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ullah</surname> <given-names>F.</given-names></name> <name><surname>Pillai</surname> <given-names>A. B.</given-names></name> <name><surname>Omar</surname> <given-names>N.</given-names></name> <name><surname>Dima</surname> <given-names>D.</given-names></name> <name><surname>Harichand</surname> <given-names>S.</given-names></name></person-group> (<year>2023</year>). <article-title>Early-onset colorectal Cancer: current insights</article-title>. <source>Cancers (Basel)</source> <volume>15</volume>:<fpage>3202</fpage>. doi: <pub-id pub-id-type="doi">10.3390/cancers15123202</pub-id>, PMID: <pub-id pub-id-type="pmid">37370811</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Velez-Arce</surname> <given-names>A.</given-names></name> <name><surname>Li</surname> <given-names>M. M.</given-names></name> <name><surname>Gao</surname> <given-names>W.</given-names></name> <name><surname>Lin</surname> <given-names>X.</given-names></name> <name><surname>Huang</surname> <given-names>K.</given-names></name> <name><surname>Fu</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Signals in the cells: multimodal and contextualized machine learning foundations for therapeutics</article-title>. <source>bioRxiv</source> [Preprint], <fpage>2024.06.12.598655</fpage>. doi: <pub-id pub-id-type="doi">10.1101/2024.06.12.598655</pub-id>, PMID: <pub-id pub-id-type="pmid">38948789</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xiao</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Zheng</surname> <given-names>Y.</given-names></name> <name><surname>Xie</surname> <given-names>X.</given-names></name> <name><surname>Hao</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>CellAgent: An LLM-driven multi-agent framework for automated single-cell data analysis</article-title>. <source>BioRxiv</source> [Preprint]. doi: <pub-id pub-id-type="doi">10.1101/2024.05.13.593861</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>E. W.</given-names></name> <name><surname>Velazquez-Villarreal</surname> <given-names>E.</given-names></name></person-group> (<year>2025</year>). <article-title>AI-HOPE: an AI-driven conversational agent for enhanced clinical and genomic data integration in precision medicine research</article-title>. <source>Bioinformatics</source> <volume>41</volume>:<fpage>btaf359</fpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btaf359</pub-id>, PMID: <pub-id pub-id-type="pmid">40577785</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>E.-W.</given-names></name> <name><surname>Waldrup</surname> <given-names>B.</given-names></name> <name><surname>Velazquez-Villarreal</surname> <given-names>E.</given-names></name></person-group> (<year>2025a</year>). <article-title>AI-HOPE-TGFbeta: a conversational AI agent for integrative clinical and genomic analysis of TGF-&#x03B2; pathway alterations in colorectal cancer to advance precision medicine</article-title>. <source>AI</source> <volume>6</volume>:<fpage>137</fpage>. doi: <pub-id pub-id-type="doi">10.3390/ai6070137</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>E.-W.</given-names></name> <name><surname>Waldrup</surname> <given-names>B.</given-names></name> <name><surname>Velazquez-Villarreal</surname> <given-names>E.</given-names></name></person-group> (<year>2025b</year>). <article-title>From mutation to prognosis: AI-HOPE-PI3K enables artificial intelligence agent-driven integration of PI3K pathway data in colorectal Cancer precision medicine</article-title>. <source>Int. J. Mol. Sci.</source> <volume>26</volume>:<fpage>6487</fpage>. doi: <pub-id pub-id-type="doi">10.3390/ijms26136487</pub-id>, PMID: <pub-id pub-id-type="pmid">40650262</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Youssef</surname> <given-names>E.</given-names></name> <name><surname>Palmer</surname> <given-names>D.</given-names></name> <name><surname>Fletcher</surname> <given-names>B.</given-names></name> <name><surname>Vaughn</surname> <given-names>R.</given-names></name></person-group> (<year>2025</year>). <article-title>Exosomes in precision oncology and beyond: from bench to bedside in diagnostics and therapeutics</article-title>. <source>Cancers (Basel)</source> <volume>17</volume>:<fpage>940</fpage>. doi: <pub-id pub-id-type="doi">10.3390/cancers17060940</pub-id>, PMID: <pub-id pub-id-type="pmid">40149276</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>S.</given-names></name> <name><surname>Tao</surname> <given-names>F.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Sun</surname> <given-names>X.</given-names></name> <name><surname>Wu</surname> <given-names>D.</given-names></name></person-group> (<year>2020</year>). <article-title>Role of Wnt/<italic>&#x03B2;</italic>-catenin signaling in the Chemoresistance modulation of colorectal Cancer</article-title>. <source>Biomed. Res. Int.</source> <volume>2020</volume>:<fpage>9390878</fpage>. doi: <pub-id pub-id-type="doi">10.1155/2020/9390878</pub-id>, PMID: <pub-id pub-id-type="pmid">32258160</pub-id></citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name></person-group> (<year>2020</year>). <article-title>Targeting the Wnt/&#x03B2;-catenin signaling pathway in cancer</article-title>. <source>J. Hematol. Oncol.</source> <volume>13</volume>:<fpage>165</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13045-020-00990-3</pub-id>, PMID: <pub-id pub-id-type="pmid">33276800</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Z.</given-names></name> <name><surname>Wei</surname> <given-names>X.</given-names></name></person-group> (<year>2023</year>). <article-title>Artificial intelligence-assisted selection and efficacy prediction of antineoplastic strategies for precision cancer therapy</article-title>. <source>Semin. Cancer Biol.</source> <volume>90</volume>, <fpage>57</fpage>&#x2013;<lpage>72</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.semcancer.2023.02.005</pub-id>, PMID: <pub-id pub-id-type="pmid">36796530</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>B.</given-names></name> <name><surname>Li</surname> <given-names>G.</given-names></name> <name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Xu</surname> <given-names>X.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>An AI agent for fully automated multi-Omic analyses</article-title>. <source>Adv Sci (Weinh)</source> <volume>11</volume>:<fpage>e2407094</fpage>. doi: <pub-id pub-id-type="doi">10.1002/advs.202407094</pub-id>, PMID: <pub-id pub-id-type="pmid">39361263</pub-id></citation></ref>
</ref-list>
</back>
</article>