<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="systematic-review" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Artif. Intell.</journal-id>
<journal-title>Frontiers in Artificial Intelligence</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Artif. Intell.</abbrev-journal-title>
<issn pub-type="epub">2624-8212</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/frai.2025.1649746</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Artificial Intelligence</subject>
<subj-group>
<subject>Systematic Review</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Artificial intelligence for ovarian cancer diagnosis via ultrasound: a systematic review and quantitative assessment of model performance</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Garcia-Atutxa</surname>
<given-names>Igor</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn0003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2778734/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Villanueva-Flores</surname>
<given-names>Francisca</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn0003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2778636/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Barrio</surname>
<given-names>Ekaitz Dudagotia</given-names>
</name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="fn0003"><sup>&#x2020;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sanchez-Villamil</surname>
<given-names>Javier I.</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn0003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/360870/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mart&#x00ED;nez-M&#x00E1;s</surname>
<given-names>Jos&#x00E9;</given-names>
</name>
<xref rid="aff4" ref-type="aff"><sup>4</sup></xref>
<xref ref-type="author-notes" rid="fn0003"><sup>&#x2020;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Bueno-Crespo</surname>
<given-names>Andr&#x00E9;s</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<xref ref-type="author-notes" rid="fn0003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/414833/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Escuela Polit&#x00E9;cnica Superior, Universidad Cat&#x00F3;lica de Murcia (UCAM)</institution>, <addr-line>Murcia</addr-line>, <country>Spain</country></aff>
<aff id="aff2"><sup>2</sup><institution>Centro de Investigaci&#x00F3;n en Ciencia Aplicada y Tecnolog&#x00ED;a Avanzada, (CICATA) Unidad Morelos del Instituto Polit&#x00E9;cnica Nacional (IPN)</institution>, <addr-line>Xochitepec</addr-line>, <country>Mexico</country></aff>
<aff id="aff3"><sup>3</sup><institution>University of Murcia</institution>, <addr-line>Murcia</addr-line>, <country>Spain</country></aff>
<aff id="aff4"><sup>4</sup><institution>Facultad de Medicina, Universidad Cat&#x00F3;lica de Murcia (UCAM)</institution>, <addr-line>Murcia</addr-line>, <country>Spain</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/588118/overview">Tim Hulsen</ext-link>, Rotterdam University of Applied Sciences, Netherlands</p>
</fn>
<fn fn-type="edited-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/796734/overview">Wenjing Zhu</ext-link>, University of Health and Rehabilitation Sciences (Qingdao Municipal Hospital), China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3116252/overview">U&#x011F;urcan Zorlu</ext-link>, Yuksek Ihtisas Training and Research Hospital, T&#x00FC;rkiye</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Andr&#x00E9;s Bueno-Crespo, <email>abueno@ucam.edu</email></corresp>
<fn fn-type="other" id="fn0003"><p><sup>&#x2020;</sup>ORCID: Igor Garcia-Atutxa, <ext-link ext-link-type="uri" xlink:href="https://orcid.org/0009-0002-1551-2685">orcid.org/0009-0002-1551-2685</ext-link></p>
<p>Francisca Villanueva-Flores, <ext-link ext-link-type="uri" xlink:href="https://orcid.org/0000-0001-6092-4211">orcid.org/0000-0001-6092-4211</ext-link></p>
<p>Ekaitz Dudagotia Barrio, <ext-link ext-link-type="uri" xlink:href="https://orcid.org/0000-0003-0990-3081">orcid.org/0000-0003-0990-3081</ext-link></p>
<p>Javier I. Sanchez-Villamil, <ext-link ext-link-type="uri" xlink:href="https://orcid.org/0000-0003-4928-5994">orcid.org/0000-0003-4928-5994</ext-link></p>
<p>Jos&#x00E9; Mart&#x00ED;nez-M&#x00E1;s, <ext-link ext-link-type="uri" xlink:href="https://orcid.org/0000-0002-8506-9933">orcid.org/0000-0002-8506-9933</ext-link></p>
<p>Andr&#x00E9;s Bueno-Crespo, <ext-link ext-link-type="uri" xlink:href="https://orcid.org/0000-0003-1734-6852">orcid.org/0000-0003-1734-6852</ext-link></p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>05</day>
<month>11</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>8</volume>
<elocation-id>1649746</elocation-id>
<history>
<date date-type="received">
<day>18</day>
<month>06</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>10</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Garcia-Atutxa, Villanueva-Flores, Barrio, Sanchez-Villamil, Mart&#x00ED;nez-M&#x00E1;s and Bueno-Crespo.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Garcia-Atutxa, Villanueva-Flores, Barrio, Sanchez-Villamil, Mart&#x00ED;nez-M&#x00E1;s and Bueno-Crespo</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec id="sec1">
<title>Background</title>
<p>Early and accurate detection of ovarian cancer (OC) remains clinically challenging, prompting exploration of artificial intelligence (AI)-based ultrasound diagnostics. This systematic review and meta-analysis critically evaluate diagnostic accuracy, methodological rigor, and clinical applicability of AI models for ovarian mass classification using B-mode ultrasound.</p>
</sec>
<sec id="sec2">
<title>Methods</title>
<p>A systematic literature search following PRISMA guidelines was conducted in PubMed, IEEE Xplore, and Scopus up to December 2024. Eligible studies included AI-based ovarian mass classification using B-mode ultrasound, reporting accuracy, sensitivity, specificity, and/or area under the ROC curve (AUC). Data extraction, quality assessment (PROBAST), and meta-analysis (random effects) were independently performed by two reviewers. Heterogeneity sources were explored.</p>
</sec>
<sec id="sec3">
<title>Results</title>
<p>From 823 identified records, 44 studies met inclusion criteria, covering over 650,000 images. Pooled performance metrics indicated high accuracy (92.3%), sensitivity (91.6%), specificity (90.1%), and AUC (0.93). Automated segmentation significantly outperformed manual segmentation in accuracy and sensitivity, demonstrating standardization benefits and reduced observer variability. Dataset size minimally correlated with performance, highlighting methodological rigor as a primary determinant. No specific AI architecture consistently outperformed others. Substantial methodological heterogeneity and frequent risk-of-bias issues (limited validation, small datasets) currently limit clinical translation.</p>
</sec>
<sec id="sec4">
<title>Conclusion</title>
<p>AI models show promising diagnostic performance for OC ultrasound imaging. However, addressing methodological challenges, including rigorous validation, standardized reporting (TRIPOD-AI, STARD-AI), and prospective multicenter studies, is essential for clinical integration. This review provides clear recommendations to enhance clinical translation of AI-based ultrasound diagnostics.</p>
</sec>
</abstract>
<abstract abstract-type="graphical">
<title>Graphical abstract</title>
<p><graphic xlink:href="frai-08-1649746-gr0001.tif" mimetype="image" mime-subtype="tiff"><alt-text content-type="machine-generated">B-mode ultrasound images show ovarian tumors in original, manual, and automatic segmentation. A comparison between expert diagnosis and artificial intelligence highlights AI's accuracy, sensitivity, specificity, and AUC. Illustrations depict healthy, early, and advanced tumor stages, with AI symbols like a magnifying glass, network, and brain.</alt-text></graphic></p>
</abstract>
<kwd-group>
<kwd>systematic review</kwd>
<kwd>meta-analysis</kwd>
<kwd>artificial intelligence</kwd>
<kwd>ultrasound</kwd>
<kwd>ovarian cancer</kwd>
<kwd>early detection</kwd>
<kwd>deep learning</kwd>
</kwd-group>
<counts>
<fig-count count="9"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="80"/>
<page-count count="17"/>
<word-count count="11078"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Medicine and Public Health</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec5">
<label>1</label>
<title>Introduction</title>
<p>Ovarian cancer (OC) is the most lethal gynecological neoplasm and the fifth leading cause of cancer-related mortality in women (<xref ref-type="bibr" rid="ref17">Dalmartello et al., 2022</xref>; <xref ref-type="bibr" rid="ref66">Siegel et al., 2021</xref>). The incidence of OC in the USA is estimated to be 10.2 cases, and the mortality rate is 6.0 deaths per 100,000 women per year, indicating approximately 1.1% lifetime risk for women (<xref ref-type="bibr" rid="ref52">NIH, 2020</xref>). Despite advances in diagnosis and treatment, the mortality rate has not shown a significant decline over the past three decades, primarily due to the challenges in early detection and limited therapeutic efficacy in advanced-stage disease (<xref ref-type="bibr" rid="ref8">Badgwell and Bast, 2007</xref>; <xref ref-type="bibr" rid="ref30">Jacobs and Menon, 2004</xref>; <xref ref-type="bibr" rid="ref9">Bast et al., 2007</xref>; <xref ref-type="bibr" rid="ref72">Torre et al., 2018</xref>). Currently, 70% of OC cases are diagnosed at advanced stages, where five-year survival drastically drops to 20%&#x2013;30%, in contrast to 80%&#x2013;95% survival when detected at early stages (<xref ref-type="bibr" rid="ref11">Bowtell et al., 2015</xref>). Therefore, improving early-stage detection methods is critically important to enhance patient outcomes.</p>
<p>Transvaginal ultrasound (TVS), computed tomography (CT), and magnetic resonance imaging (MRI) are the primary imaging modalities for OC detection. TVS is particularly advantageous as a non-invasive, cost-effective, accessible, and real-time imaging method, allowing assessment of ovarian masses&#x2019; size, shape, and internal structures (e.g., septa, solid tissue), aiding differentiation between benign and malignant tumors. However, the limited resolution of TVS may fail to detect small or early-stage tumors, and overlapping anatomical structures, such as bowel loops or normal ovarian tissue, complicate mass differentiation. Moreover, specific OC subtypes do not exhibit significant morphological changes in early phases, reducing sensitivity (<xref ref-type="bibr" rid="ref76">Wu et al., 2018</xref>; <xref ref-type="bibr" rid="ref61">Rosati et al., 2020</xref>).</p>
<p>Despite these limitations, TVS remains indispensable in the initial OC diagnosis due to accessibility and low cost. However, interpretation often varies significantly with radiologist experience, resulting in diagnostic inconsistencies and clinical errors (<xref ref-type="bibr" rid="ref10">B&#x00E4;umler et al., 2020</xref>; <xref ref-type="bibr" rid="ref51">Nebgen et al., 2019</xref>). These issues underscore the critical need for standardized, objective, and automated diagnostic methods that enhance accuracy and reduce inter-observer variability.</p>
<p>Artificial intelligence (AI) integration has significantly advanced medical imaging diagnostics, improving tumor identification accuracy and consistency. Convolutional neural networks (CNNs), a sophisticated deep learning (DL) architecture, have demonstrated over 90% accuracy in extracting complex TVS image features and classifying ovarian malignancy in several studies (<xref ref-type="bibr" rid="ref4">Akazawa and Hashimoto, 2021</xref>; <xref ref-type="bibr" rid="ref67">Sone et al., 2021</xref>). Beyond accuracy, AI reduces human interpretation errors and enables the analysis of large datasets (<xref ref-type="bibr" rid="ref21">Falana et al., 2023</xref>; <xref ref-type="bibr" rid="ref63">Sahu and Shrivastava, 2023</xref>).</p>
<p>However, several challenges hinder the clinical translation of AI in OC detection. Crucially, existing DL models suffer from inadequate dataset representativeness, as most research uses datasets from single institutions, leading to population biases. AI model performance notably declines when tested on populations with different ethnic, geographic, or technological characteristics (<xref ref-type="bibr" rid="ref54">Noseworthy et al., 2020</xref>). Additionally, heterogeneity in TVS image quality, formats, resolution, and acquisition protocols across institutions further impairs AI model reproducibility and generalizability (<xref ref-type="bibr" rid="ref58">Raciti et al., 2023</xref>).</p>
<p>A significant barrier is the absence of robust prospective clinical validation. Most AI algorithms have been validated retrospectively, limiting insights into their real-time clinical applicability (<xref ref-type="bibr" rid="ref58">Raciti et al., 2023</xref>). Furthermore, lack of standardized annotation and segmentation protocols significantly impacts AI model accuracy, with manual segmentation inconsistencies affecting performance by up to 20% (<xref ref-type="bibr" rid="ref26">Heinlein et al., 2024</xref>; <xref ref-type="bibr" rid="ref27">Ho et al., 2022</xref>). The absence of international consortia, standardized benchmarking, and sufficiently large, diverse, open-access TVS image databases also restrict the comparative evaluation and robust training of AI models. While initiatives like The Cancer Imaging Archive (TCIA) have addressed similar needs in other cancer areas, a parallel effort for OC is currently lacking (<xref ref-type="bibr" rid="ref53">NIH, n.d.</xref>).</p>
<p>This systematic review and quantitative meta-analysis address these critical knowledge gaps by evaluating the diagnostic performance of AI models applied specifically to B-mode TVS images for early OC detection. Through a comprehensive comparison of accuracy, sensitivity, specificity, and area under the curve (AUC) across CNNs, classical machine learning algorithms, and transformer-based models, the study assesses how methodological factors, such as segmentation and dataset size, influence model performance. Clarifying these factors is expected to enhance clinical practice directly by guiding the development of robust, standardized AI tools capable of improving early OC diagnosis, thereby increasing patient survival rates and clinical outcomes.</p>
</sec>
<sec sec-type="methods" id="sec6">
<label>2</label>
<title>Methodology</title>
<p>This study was designed and conducted following the PRISMA 2020 guidelines (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) (<xref ref-type="bibr" rid="ref37">Liberati et al., 2009</xref>; <xref ref-type="bibr" rid="ref55">Page et al., 2021</xref>) to ensure transparency, reproducibility, and comprehensiveness in the systematic review and meta-analysis (<xref rid="SM1" ref-type="supplementary-material">Supplementary Tables S1, S2</xref>). The methodological protocol included a predefined search strategy, explicit eligibility criteria, risk of bias assessment, and statistical analysis of the extracted data. Specifically, the systematic review was guided by the following research questions:</p>
<list list-type="bullet">
<list-item>
<p>What is the diagnostic accuracy (accuracy, sensitivity, specificity, and AUC) of AI-based models for ovarian mass classification using B-mode ultrasound?</p>
</list-item>
<list-item>
<p>Which methodological factors, such as segmentation methodology (automatic vs. manual), dataset size, AI model architecture, and risk of bias significantly influence the diagnostic performance of AI models?</p>
</list-item>
</list>
<sec id="sec7">
<label>2.1</label>
<title>Search strategy</title>
<p>In January 2025, a comprehensive search was conducted in three high-impact scientific databases: PubMed, IEEE Xplore, and Scopus. The search strategy included the following terms combined using Boolean operators: (&#x201C;machine learning&#x201D; OR &#x201C;artificial intelligence&#x201D; OR &#x201C;deep learning&#x201D; OR &#x201C;neural network&#x201D;) AND (&#x201C;ovarian cancer&#x201D; OR &#x201C;ovarian tumor&#x201D;) AND &#x201C;ultrasound.&#x201D; No language or publication type restrictions were applied during the initial search.</p>
</sec>
<sec id="sec8">
<label>2.2</label>
<title>Eligibility criteria</title>
<p>The following inclusion and exclusion criteria were explicitly defined to ensure transparency and reproducibility in the systematic selection of studies (see <xref ref-type="table" rid="tab1">Table 1</xref>).</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Inclusion and exclusion criteria for study selection.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Inclusion criteria</th>
<th align="left" valign="top">Exclusion criteria</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Original research articles evaluating AI models</td>
<td align="left" valign="top">Systematic reviews, meta-analyses, letters to the editor, or abstracts from conferences</td>
</tr>
<tr>
<td align="left" valign="top">Studies utilizing 2D B-mode transvaginal ultrasound (TVS) images</td>
<td align="left" valign="top">Studies employing imaging modalities other than ultrasound (e.g., CT, MRI)</td>
</tr>
<tr>
<td align="left" valign="top">Studies involving the detection or classification of ovarian cancer in humans</td>
<td align="left" valign="top">Studies exclusively focused on serological biomarkers, genomic analyses, or animal models</td>
</tr>
<tr>
<td align="left" valign="top">Studies reporting at least one performance metric (accuracy, sensitivity, specificity, or AUC)</td>
<td align="left" valign="top">Studies without accessible full text or not reporting any relevant performance metric</td>
</tr>
<tr>
<td align="left" valign="top">Studies based on real patient data</td>
<td align="left" valign="top">Purely theoretical studies without clinical validation</td>
</tr>
<tr>
<td align="left" valign="top">Full-text articles published in English or Spanish</td>
<td align="left" valign="top">Studies published in languages other than English or Spanish</td>
</tr>
<tr>
<td align="left" valign="top">Studies published up to December 2024</td>
<td align="left" valign="top">Studies published after December 2024</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Studies meeting all inclusion criteria and none of the exclusion criteria were eligible for inclusion in this systematic review and meta-analysis.</p>
</sec>
<sec id="sec9">
<label>2.3</label>
<title>Study selection process</title>
<p>Two independent reviewers (IGA and FVF) initially evaluated the title and abstract of each article identified through the database search, applying the inclusion and exclusion criteria explicitly defined in Section 2.2. This preliminary assessment allowed for the exclusion of clearly irrelevant or ineligible studies. In cases of discrepancies during this initial stage, a third reviewer (EDB) was consulted to reach consensus. Subsequently, the full texts of the preselected articles were reviewed again by both reviewers (IGA and FVF) to confirm their definitive eligibility for inclusion in the quantitative analysis.</p>
</sec>
<sec id="sec10">
<label>2.4</label>
<title>Data extraction</title>
<p>The following variables were extracted from each study: author, year, type of segmentation, model architecture, model name, image dataset size, type of ovarian masses, number of classes, and performance metrics (accuracy, sensitivity, specificity, and AUC). For studies reporting multiple models, the one with the best overall performance was selected to avoid data duplication. The information was systematized into a structured database for subsequent statistical analysis.</p>
</sec>
<sec id="sec11">
<label>2.5</label>
<title>Risk of bias assessment</title>
<p>The methodological quality of the included studies was assessed using the PROBAST tool (Prediction model Risk of Bias Assessment Tool) (<xref ref-type="bibr" rid="ref75">Wolff et al., 2019</xref>), which evaluates the risk of bias and applicability in studies that develop or validate prediction models. PROBAST comprises 20 items grouped into four domains: (i) participant selection, (ii) predictors, (iii) outcomes, and (iv) statistical analysis. Two reviewers (IGA and FVF) independently performed this evaluation. Discrepancies were resolved by consensus. A detailed assessment of the 20 PROBAST items for each study and domain-specific classifications is included as <xref rid="SM1" ref-type="supplementary-material">Supplementary Tables S3, S4</xref>.</p>
</sec>
<sec id="sec12">
<label>2.6</label>
<title>Statistical analysis</title>
<sec id="sec13">
<label>2.6.1</label>
<title>Descriptive statistics and distribution assessment</title>
<p>Descriptive statistics were calculated for performance metrics, including accuracy, sensitivity, specificity, and AUC, and are reported as means, standard deviations, and ranges. The Shapiro&#x2013;Wilk test was used to assess the normality of distributions, while Levene&#x2019;s test was applied to evaluate the homogeneity of variances.</p>
<p>Because F1-score was rarely reported and often lacked the underlying confusion matrix, we did not meta-analyze F1. For interpretability, accuracy, sensitivity, specificity, and AUC remained our primary endpoints.</p>
</sec>
<sec id="sec14">
<label>2.6.2</label>
<title>Comparison between segmentation methods (automatic vs. manual)</title>
<p>Given the presence of non-normal distributions and limited subgroup sizes, non-parametric tests were prioritized to enhance statistical validity. Specifically, a Mann&#x2013;Whitney U test was used to compare accuracy between automatic and manual segmentation strategies.</p>
</sec>
<sec id="sec15">
<label>2.6.3</label>
<title>Comparison across AI model architectures</title>
<p>Differences in accuracy across AI architecture categories (e.g., CNN, ML, ANN) were assessed using a Kruskal&#x2013;Wallis H test. Additionally, performance variation between DL models (e.g., CNNs) and classical machine learning approaches was evaluated using one-way analysis of variance (ANOVA).</p>
</sec>
<sec id="sec16">
<label>2.6.4</label>
<title>Correlation between dataset size and diagnostic performance</title>
<p>The relationship between dataset size and diagnostic performance was explored using Pearson&#x2019;s correlation, excluding studies with more than 5,000 images to mitigate the influence of extreme values.</p>
</sec>
<sec id="sec17">
<label>2.6.5</label>
<title>Meta-regression analysis of methodological factors</title>
<p>A meta-regression analysis was performed using ordinary least squares (OLS) modeling to investigate the combined influence of methodological variables on diagnostic performance. Accuracy was modeled as the dependent variable, and key predictors included dataset size, segmentation type (automatic vs. manual), model architecture (CNN vs. other), and risk of bias (high vs. low). The regression included 26 studies with complete data and demonstrated that segmentation type was a significant predictor of accuracy (<italic>&#x03B2;</italic>&#x202F;=&#x202F;0.0656, <italic>p</italic>&#x202F;=&#x202F;0.007), while the other covariates did not reach statistical significance. The model explained approximately 32% of the variance in accuracy (adjusted <italic>R</italic><sup>2</sup>&#x202F;=&#x202F;0.32), supporting the relevance of segmentation quality as a determinant of AI model performance.</p>
</sec>
<sec id="sec18">
<label>2.6.6</label>
<title>Subgroup and sensitivity analyses</title>
<p>Subgroup analyses were conducted based on risk of bias (assessed by PROBAST), and a sensitivity analysis was performed by excluding studies rated as high risk to determine the robustness of findings.</p>
</sec>
<sec id="sec19">
<label>2.6.7</label>
<title>Software and reproducibility</title>
<p>All statistical analyses were conducted using Python (v3.12), leveraging the pandas, numpy, scipy, statsmodels, matplotlib, and seaborn libraries. Complete analysis code and data visualizations are available upon request.</p>
<p>All figures include concise alternative text in the captions, and a separate <xref rid="SM1" ref-type="supplementary-material">Supplementary material</xref> provides long textual descriptions.</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="sec20">
<label>3</label>
<title>Results</title>
<p>The systematic search in the PubMed, IEEE Xplore, and Scopus databases yielded 823 studies. After removing 58 duplicates, 765 titles and abstracts were screened. Of these, 686 were excluded for not meeting the inclusion criteria, resulting in 79 articles for full-text review. Finally, 44 studies were included in the quantitative analysis (<xref ref-type="fig" rid="fig1">Figure 1</xref>).</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>PRISMA flow diagram of our study. The figure illustrates the study selection process following PRISMA 2020 guidelines. A total of 823 records were identified through three databases (PubMed, IEEE Xplore, and Scopus). After removing 58 duplicates, 765 titles and abstracts were screened, excluding 686 studies that did not meet the eligibility criteria. Seventy-nine full-text articles were assessed for inclusion, of which 35 were excluded for using non-ultrasound imaging modalities (e.g., CT or MRI), focusing exclusively on segmentation methods, or lacking histopathological validation. Ultimately, 44 studies were included in the final quantitative analysis.</p>
</caption>
<graphic xlink:href="frai-08-1649746-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Flowchart detailing the study selection process for a systematic review. Identification phase: 823 records from PubMed (177), IEEE (52), and Scopus (594) are identified. Screening phase: 58 duplicates removed, 765 abstracts reviewed; 686 records excluded based on title and abstract. Full-text review: 79 articles, with 35 excluded for specific criteria, resulting in 44 studies included in the systematic review.</alt-text>
</graphic>
</fig>
<p>The studies cover a period up to December 2024. Collectively, they analyzed over 650,000 B-mode TVS images for ovarian mass classification using various AI models. Most studies (<italic>n</italic>&#x202F;=&#x202F;27; 61.4%) used automatic segmentation, while the remainder (<italic>n</italic>&#x202F;=&#x202F;17; 38.6%) employed manual segmentation. The predominant architectures were CNNs, followed by classical ML algorithms, conventional artificial neural networks (ANNs), and transformer-based architectures that have emerged in recent years (<xref ref-type="table" rid="tab2">Table 2</xref>).</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>List of the 44 articles analyzed.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Id</th>
<th align="left" valign="top">References</th>
<th align="center" valign="top">Year</th>
<th align="left" valign="top">Segmentation</th>
<th align="left" valign="top">Algorithm architecture</th>
<th align="left" valign="top">Artificial intelligence model</th>
<th align="center" valign="top">Size of dataset</th>
<th align="left" valign="top">Type of masses</th>
<th align="center" valign="top">Classes</th>
<th align="center" valign="top">Accuracy</th>
<th align="center" valign="top">Sensitivity</th>
<th align="center" valign="top">Specificity</th>
<th align="center" valign="top">AUC</th>
<th align="center" valign="top">Risk of bias</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">1</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref59">Ravishankar et al. (2023)</xref>
</td>
<td align="center" valign="top">2023</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">OCD-FCNN</td>
<td align="center" valign="top">440</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">8</td>
<td align="center" valign="top">0.984</td>
<td align="center" valign="top">0.97</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">High</td>
</tr>
<tr>
<td align="left" valign="top">2</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref35">Li et al. (2022)</xref>
</td>
<td align="center" valign="top">2022</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">LKResNet-18</td>
<td align="center" valign="top">5,714</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">3</td>
<td align="center" valign="top">0.9145</td>
<td align="center" valign="top">0.918</td>
<td align="center" valign="top">0.918</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">3</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref22">Fan et al. (2023)</xref>
</td>
<td align="center" valign="top">2023</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">Ocys-Net</td>
<td align="center" valign="top">750</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">3</td>
<td align="center" valign="top">0.955</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.885</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">4</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref5">Al-karawi et al. (2021)</xref>
</td>
<td align="center" valign="top">2021</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">SVM</td>
<td align="center" valign="top">242</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">3</td>
<td align="center" valign="top">0.8058</td>
<td align="center" valign="top">0.8104</td>
<td align="center" valign="top">0.8022</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">5</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref56">Patil et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">RF</td>
<td align="center" valign="top">187</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">3</td>
<td align="center" valign="top">0.86</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">6</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref33">Kiruthika et al. (2023)</xref>
</td>
<td align="center" valign="top">2023</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">SVM</td>
<td align="center" valign="top">630</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">3</td>
<td align="center" valign="top">0.965</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.955</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">7</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref73">Wang et al. (2021)</xref>
</td>
<td align="center" valign="top">2021</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">ResNet-34</td>
<td align="center" valign="top">279</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">3</td>
<td align="center" valign="top">0.914</td>
<td align="center" valign="top">0.914</td>
<td align="center" valign="top">0.914</td>
<td align="center" valign="top">0.963</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">8</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref65">Shih-Tien et al. (2022)</xref>
</td>
<td align="center" valign="top">2022</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">EL</td>
<td align="center" valign="top">1896</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.9215</td>
<td align="center" valign="top">0.9137</td>
<td align="center" valign="top">0.9292</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">9</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref45">Meijing et al. (2023)</xref>
</td>
<td align="center" valign="top">2023</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">ResNext50</td>
<td align="center" valign="top">1,142</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">7</td>
<td align="center" valign="top">0.952</td>
<td align="center" valign="top">0.895</td>
<td align="center" valign="top">0.992</td>
<td align="center" valign="top">0.997</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">10</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref12">Chen et al. (2022)</xref>
</td>
<td align="center" valign="top">2022</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">ResNet-18</td>
<td align="center" valign="top">422</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.92</td>
<td align="center" valign="top">0.85</td>
<td align="center" valign="top">0.93</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">11</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref23">Gao et al. (2022)</xref>
</td>
<td align="center" valign="top">2022</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">DenseNet-121</td>
<td align="center" valign="top">575,930</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.888</td>
<td align="center" valign="top">0.789</td>
<td align="center" valign="top">0.932</td>
<td align="center" valign="top">0.911</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">12</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref78">Xiang et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">EL</td>
<td align="center" valign="top">3,972</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.876</td>
<td align="center" valign="top">0.973</td>
<td align="center" valign="top">0.741</td>
<td align="center" valign="top">0.97</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">13</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref19">Du et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">ANN</td>
<td align="left" valign="top">DLRN</td>
<td align="center" valign="top">849</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.871</td>
<td align="center" valign="top">0.733</td>
<td align="center" valign="top">0.880</td>
<td align="center" valign="top">0.928</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">14</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref47">Miao et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">ConvNeXt</td>
<td align="center" valign="top">575</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.90</td>
<td align="center" valign="top">0.90</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.90</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">15</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref6">Alwan et al. (2023)</xref>
</td>
<td align="center" valign="top">2023</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">CNN</td>
<td align="center" valign="top">196</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.9897</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">High</td>
</tr>
<tr>
<td align="left" valign="top">16</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref44">Mart&#x00ED;nez-M&#x00E1;s et al. (2019)</xref>
</td>
<td align="center" valign="top">2019</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">SVM</td>
<td align="center" valign="top">187</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.8770</td>
<td align="center" valign="top">0.91</td>
<td align="center" valign="top">0.83</td>
<td align="center" valign="top">0.8740</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">17</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref2">Acharya et al. (2014)</xref>
</td>
<td align="center" valign="top">2014</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">ANN</td>
<td align="left" valign="top">PNN</td>
<td align="center" valign="top">2,600</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.9981</td>
<td align="center" valign="top">0.9992</td>
<td align="center" valign="top">0.9969</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">High</td>
</tr>
<tr>
<td align="left" valign="top">18</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref29">Hussein et al. (2020)</xref>
</td>
<td align="center" valign="top">2020</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">FDA</td>
<td align="left" valign="top">Viola-Jones</td>
<td align="center" valign="top">125</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.9484</td>
<td align="center" valign="top">0.9696</td>
<td align="center" valign="top">0.9032</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">19</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref28">Hussein et al. (2022)</xref>
</td>
<td align="center" valign="top">2021</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">ANN</td>
<td align="left" valign="top">ANN</td>
<td align="center" valign="top">250</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.9587</td>
<td align="center" valign="top">0.9701</td>
<td align="center" valign="top">0.9333</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">20</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref3">Acharya et al. (2014)</xref>
</td>
<td align="center" valign="top">2014</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">ANN</td>
<td align="left" valign="top">PNN</td>
<td align="center" valign="top">2,600</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">1.00</td>
<td align="center" valign="top">1.00</td>
<td align="center" valign="top">1.00</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">High</td>
</tr>
<tr>
<td align="left" valign="top">21</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref31">Jeevitha and Priya (2022)</xref>
</td>
<td align="center" valign="top">2022</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">SVM</td>
<td align="center" valign="top">100</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">3</td>
<td align="center" valign="top">0.985</td>
<td align="center" valign="top">0.940</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">22</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref74">Wang et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">ResNet-50</td>
<td align="center" valign="top">1,054</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.9476</td>
<td align="center" valign="top">0.9428</td>
<td align="center" valign="top">0.9500</td>
<td align="center" valign="top">0.984</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">23</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref50">Narmatha et al. (2023)</xref>
</td>
<td align="center" valign="top">2023</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">RNN</td>
<td align="left" valign="top">Deep Q-Network</td>
<td align="center" valign="top">478</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">7</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">0.96</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">24</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref80">Yuyeon et al. (2022)</xref>
</td>
<td align="center" valign="top">2022</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">DenseNet161</td>
<td align="center" valign="top">1,613</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">5</td>
<td align="center" valign="top">0.9012</td>
<td align="center" valign="top">0.8667</td>
<td align="center" valign="top">0.9185</td>
<td align="center" valign="top">0.9406</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">25</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref57">Pham and Le (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">YOLOv8</td>
<td align="center" valign="top">1,469</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">8</td>
<td align="center" valign="top">0.9126</td>
<td align="center" valign="top">0.8330</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">26</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref34">Kongara et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">CNN</td>
<td align="center" valign="top">3,280</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.9918</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">27</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref36">Li et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">PMFFNet</td>
<td align="center" valign="top">1,469</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">7</td>
<td align="center" valign="top">0.9724</td>
<td align="center" valign="top">0.9855</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">28</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref48">Miao et al. (2023)</xref>
</td>
<td align="center" valign="top">2023</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">ResNet-34</td>
<td align="center" valign="top">1,130</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.97</td>
<td align="center" valign="top">0.93</td>
<td align="center" valign="top">0.95</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">29</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref49">Moro et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">RF</td>
<td align="center" valign="top">775</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.99</td>
<td align="center" valign="top">0.64</td>
<td align="center" valign="top">0.88</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">30</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref13">Chiappa et al. (2021)</xref>
</td>
<td align="center" valign="top">2020</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">CNN</td>
<td align="center" valign="top">241</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">3</td>
<td align="center" valign="top">0.83</td>
<td align="center" valign="top">0.78</td>
<td align="center" valign="top">0.85</td>
<td align="center" valign="top">0.88</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">31</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref77">Xi et al. (2023)</xref>
</td>
<td align="center" valign="top">2023</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">DenseNet</td>
<td align="center" valign="top">1,103</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.964</td>
<td align="center" valign="top">0.997</td>
<td align="center" valign="top">0.952</td>
<td align="center" valign="top">0.973</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">32</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref69">&#x0218;tefan et al. (2021)</xref>
</td>
<td align="center" valign="top">2021</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">KNN</td>
<td align="center" valign="top">123</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.9048</td>
<td align="center" valign="top">0.931</td>
<td align="center" valign="top">0.951</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">33</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref14">Christiansen et al. (2021)</xref>
</td>
<td align="center" valign="top">2021</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">EL</td>
<td align="center" valign="top">3,077</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.971</td>
<td align="center" valign="top">0.937</td>
<td align="center" valign="top">0.958</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">34</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref7">Aramend&#x00ED;a-Vidaurreta et al. (2015)</xref>
</td>
<td align="center" valign="top">2015</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">ANN</td>
<td align="left" valign="top">MLP</td>
<td align="center" valign="top">145</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.9878</td>
<td align="center" valign="top">0.9850</td>
<td align="center" valign="top">0.9890</td>
<td align="center" valign="top">0.997</td>
<td align="center" valign="top">Unclear</td>
</tr>
<tr>
<td align="left" valign="top">35</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref39">Liu et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">ResNet-101</td>
<td align="center" valign="top">1,080</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.849</td>
<td align="center" valign="top">0.930</td>
<td align="center" valign="top">0.817</td>
<td align="center" valign="top">0.935</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">36</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref40">Liu et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">LR</td>
<td align="center" valign="top">407</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.948</td>
<td align="center" valign="top">0.955</td>
<td align="center" valign="top">0.942</td>
<td align="center" valign="top">0.981</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">37</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref18">Du et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">ResNet-50</td>
<td align="center" valign="top">849</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">3</td>
<td align="center" valign="top">0.8003</td>
<td align="center" valign="top">0.7515</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.85</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">38</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref71">Tang et al. (2022)</xref>
</td>
<td align="center" valign="top">2022</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">LR</td>
<td align="center" valign="top">206</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.886</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">39</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref1">Acharya et al. (2018)</xref>
</td>
<td align="center" valign="top">2018</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">RF</td>
<td align="center" valign="top">469</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.8060</td>
<td align="center" valign="top">0.8140</td>
<td align="center" valign="top">0.7630</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">High</td>
</tr>
<tr>
<td align="left" valign="top">40</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref64">Sha (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">AdaResU-Net</td>
<td align="center" valign="top">700</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.9887</td>
<td align="center" valign="top">0.9850</td>
<td align="center" valign="top">0.9960</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">High</td>
</tr>
<tr>
<td align="left" valign="top">41</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref79">Xie et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">CNN</td>
<td align="left" valign="top">YOLOv8</td>
<td align="center" valign="top">1,619</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.935</td>
<td align="center" valign="top">0.905</td>
<td align="center" valign="top">0.935</td>
<td align="center" valign="top">0.930</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">42</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref24">Giourga et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">ML</td>
<td align="left" valign="top">EL</td>
<td align="center" valign="top">3,510</td>
<td align="left" valign="top">Cysts</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">0.909</td>
<td align="center" valign="top">0.965</td>
<td align="center" valign="top">0.881</td>
<td align="center" valign="top">0.922</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">43</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref25">He et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Manual</td>
<td align="left" valign="top">TBM</td>
<td align="left" valign="top">Swin transformer</td>
<td align="center" valign="top">7,639</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">0.872</td>
<td align="center" valign="top">0.943</td>
<td align="center" valign="top">0.920</td>
<td align="center" valign="top">Low</td>
</tr>
<tr>
<td align="left" valign="top">44</td>
<td align="left" valign="top">
<xref ref-type="bibr" rid="ref16">Dai et al. (2024)</xref>
</td>
<td align="center" valign="top">2024</td>
<td align="left" valign="top">Automatic</td>
<td align="left" valign="top">TBM</td>
<td align="left" valign="top">Pyramid visual transformer</td>
<td align="center" valign="top">6,938</td>
<td align="left" valign="top">Tumors</td>
<td align="center" valign="top">3</td>
<td align="center" valign="top">0.873</td>
<td align="center" valign="top">0.878</td>
<td align="center" valign="top">0.869</td>
<td align="center" valign="top">0.941</td>
<td align="center" valign="top">Low</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>AUC, area under the curve; CNN, convolutional neural network; FCNN, fuzzy rule-based convolutional neural network; ML, machine learning; SVM, support vector machine: RF, random forest; EL, ensemble learning; ANN, artificial neural network; DLRN, deep learning radiomics nomogram; PNN, probabilistic neural network; FDA, face detection algorithm; RNN, recurrent neural network; KNN, K-nearest neighbor; MLP, multilayer perceptron networks; LR, logistic regression; TBM, transformer-based models.</p>
</table-wrap-foot>
</table-wrap>
<sec id="sec21">
<label>3.1</label>
<title>Overall performance of AI models</title>
<p>The analysis of the 44 included studies revealed the high average diagnostic performance of AI models applied to B-mode TVS images for OC detection. The mean accuracy was 92.3%&#x202F;&#x00B1;&#x202F;5.8, with mean sensitivity and specificity of 91.6%&#x202F;&#x00B1;&#x202F;7.2 and 90.1%&#x202F;&#x00B1;&#x202F;8.1, respectively. AUC values were reported in only 23 studies, with a mean of 0.93&#x202F;&#x00B1;&#x202F;0.04, reflecting strong overall discriminative capacity. However, the partial availability of AUC reporting may indicate a potential reporting bias that limits the robustness of comparative analysis across all models. Beyond AUC&#x2019;s limited reporting (23/44 studies), F1-score was scarcely available across the corpus. This pattern likely reflects historical reliance on accuracy/sensitivity/specificity in ultrasound AI, frequent absence of continuous model scores (hindering AUC), and the lack of confusion matrices or class-wise results needed for F1. In addition, F1 is sometimes reported as Dice in segmentation studies; because our review targets classification performance, segmentation-specific Dice metrics were not pooled, which might also contribute to the perceived under-reporting of F1.</p>
<p><xref ref-type="fig" rid="fig2">Figure 2</xref> provides a comparative overview of the four main performance metrics for the 10 top-performing models. This visualization highlights how specific models exhibit strong accuracy yet relatively lower specificity, an observation with important clinical implications when considering false-positive rates in diagnostic triage.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Top 10 AI models (comparison of accuracy, sensitivity, specificity, and AUC). This figure compares performance metrics (accuracy, sensitivity, specificity, and AUC) of the 10 highest-performing AI models identified in the review. Generally high accuracy is observed across models, but some exhibit trade-offs between sensitivity and specificity. This variability highlights the importance of selecting models not only with high overall accuracy but also clinically meaningful balance to minimize diagnostic errors, particularly false positives and false negatives.</p>
</caption>
<graphic xlink:href="frai-08-1649746-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Bar chart comparing performance scores of various models with metrics: accuracy, sensitivity, specificity, and AUC. Models include MLP, DenseNet, ResNext50, LR, ResNet-50, YOLOv8, ResNet-34, EL, DenseNet161, and Pyramid Visual Transformer, on a scale from 0.800 to 1.000.</alt-text>
</graphic>
</fig>
<p>Several models, including those based on OCD-FCNN, probabilistic neural networks (PNN), and ResNet-34, reported peak performance values exceeding 95%. However, many of these models were trained and tested on small or non-external datasets, lacked proper cross-validation, or relied exclusively on internal test sets. Such methodological limitations increase the likelihood of overfitting and restrict the generalizability of reported outcomes. None of the highest-performing models reported prospective validation or integration into clinical workflows, which remains essential for evaluating real-world applicability.</p>
<p>To assess whether methodological design influenced diagnostic performance, non-parametric tests were conducted using accuracy as the outcome variable. A Mann&#x2013;Whitney <italic>U</italic>-test revealed a statistically significant difference in accuracy between models using automatic versus manual segmentation (<italic>U</italic>&#x202F;=&#x202F;234.0, <italic>p</italic>&#x202F;=&#x202F;0.007), favoring automatic methods. This finding suggests that automated segmentation enhances standardization and reduces variability across studies.</p>
<p>Conversely, a Kruskal&#x2013;Wallis test comparing performance across AI architectures (e.g., CNN, ML, ANN) did not identify statistically significant differences (<italic>H</italic> =&#x202F;6.53, <italic>p</italic>&#x202F;=&#x202F;0.258), indicating that no specific architectural family demonstrated superior accuracy within the current dataset. Nevertheless, visual inspection using violin plots (<xref ref-type="fig" rid="fig3">Figure 3</xref>) showed a moderately higher central tendency and reduced the variance in accuracy among CNN-based models compared to classical machine learning (ML) approaches. While this pattern may reflect the architectural strengths of CNNs in capturing spatial hierarchies within medical images (<xref ref-type="bibr" rid="ref38">Litjens et al., 2017</xref>), it should be interpreted cautiously. CNN-based models were more frequently applied in recent studies, which may also have benefited from advances in data augmentation, automatic segmentation, and preprocessing pipelines. Therefore, the observed trend could be confounded by methodological improvements rather than an inherent advantage of architecture.</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Accuracy distribution by AI architecture: CNN vs. classical machine learning (ML). This figure illustrates that, although there is no statistically significant difference between architectures (<italic>p</italic>&#x202F;=&#x202F;0.258), CNN-based models tend to display higher median accuracy and reduced variability compared to classical ML models. This result suggests a potential advantage of CNNs, likely due to their superior ability to capture complex features from medical images, though methodological advances in recent studies may also contribute to this observed trend.</p>
</caption>
<graphic xlink:href="frai-08-1649746-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Violin plot comparing accuracy of CNN and ML architectures. The CNN distribution is in blue, and ML is in orange. Both show similar median accuracies around 0.9.</alt-text>
</graphic>
</fig>
<p>It is also important to note that model performance was evaluated exclusively using accuracy, as this was the most consistently reported metric across studies. While this allowed for comparability, it may limit interpretability in class-imbalanced settings, where metrics such as AUC or F1-score are often more informative. Future studies should prioritize the reporting of multiple complementary metrics to capture diagnostic value more comprehensively.</p>
<p>These descriptive findings are further explored and formally tested in the meta-regression presented in Section 3.4.</p>
<p>In summary, while reported performance metrics are generally high, the absence of standardized validation protocols, partial reporting of key metrics, lack of weighted or stratified analyses, and underreporting of methodological variables (especially segmentation and validation strategies) limit the interpretability and clinical generalizability of the findings. Future studies should adopt harmonized reporting guidelines (e.g., TRIPOD-AI, PROBAST-AI), employ multicenter and external validation, and report performance metrics in clinically meaningful terms to support reliable and reproducible integration into diagnostic workflows.</p>
</sec>
<sec id="sec22">
<label>3.2</label>
<title>Relationship between dataset size and performance</title>
<p>The relationship between the number of images used to train AI models and their diagnostic performance was evaluated using non-parametric correlation analysis. Although Pearson&#x2019;s method was initially considered, the Shapiro&#x2013;Wilk test confirmed that dataset size and performance metrics (accuracy, sensitivity, specificity) were not normally distributed (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.001 for all), prompting the use of Spearman&#x2019;s rank correlation.</p>
<p>Studies with more than 5,000 images were excluded from this analysis to reduce the risk of statistical distortion from highly imbalanced sample sizes. While large-scale datasets (up to 575,000 images) have become increasingly common in AI development, such volumes do not reflect typical clinical practice and may disproportionately drive correlation estimates. The 5,000-image threshold was selected to capture real-world data conditions better while preserving inter-study variability. Descriptive analysis of the full dataset showed that this threshold approximately corresponds to the 75th percentile of dataset sizes among included studies.</p>
<p>Spearman correlation coefficients between dataset size (&#x2264;5,000) and model performance metrics were weak and statistically non-significant. Specifically, the correlation with accuracy was <italic>&#x03C1;</italic>&#x202F;=&#x202F;0.080 (<italic>p</italic>&#x202F;=&#x202F;0.653), with a 95% confidence interval of &#x2212;0.27 to 0.41 and an <italic>R</italic><sup>2</sup> of 0.006, suggesting that less than 1% of the variation in accuracy could be explained by dataset size. For sensitivity, the correlation was &#x03C1;&#x202F;=&#x202F;0.246 (<italic>p</italic>&#x202F;=&#x202F;0.154; 95% CI: &#x2212;0.09 to 0.54; <italic>R</italic><sup>2</sup>&#x202F;=&#x202F;0.061), and for specificity, &#x03C1;&#x202F;=&#x202F;0.183 (<italic>p</italic>&#x202F;=&#x202F;0.350; 95% CI: &#x2212;0.20 to 0.52; <italic>R</italic><sup>2</sup>&#x202F;=&#x202F;0.034). <xref ref-type="table" rid="tab3">Table 3</xref> summarizes these results, including the correlation coefficients, confidence intervals, and the proportion of explained variance.</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Correlation between dataset size and performance metrics.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Performance metric</th>
<th align="center" valign="top">Spearman &#x03C1;</th>
<th align="center" valign="top">95% CI</th>
<th align="center" valign="top">
<italic>R</italic>
<sup>2</sup>
</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Accuracy</td>
<td align="center" valign="top">0.080</td>
<td align="center" valign="top">[&#x2212;0.27, 0.41]</td>
<td align="center" valign="top">0.006</td>
</tr>
<tr>
<td align="left" valign="top">Sensitivity</td>
<td align="center" valign="top">0.246</td>
<td align="center" valign="top">[&#x2212;0.09, 0.54]</td>
<td align="center" valign="top">0.061</td>
</tr>
<tr>
<td align="left" valign="top">Specificity</td>
<td align="center" valign="top">0.183</td>
<td align="center" valign="top">[&#x2212;0.20, 0.52]</td>
<td align="center" valign="top">0.034</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>While these findings suggest that increasing dataset size within the studied range does not systematically improve model performance, this interpretation should be cautiously made. The exclusion of large datasets may limit the generalizability of these findings, and potential interaction effects, such as those involving the segmentation method, risk of bias, or model architecture, were not examined in this univariate analysis. These results are, however, consistent with the multivariable meta-regression analysis presented in Section 4, in which dataset size did not emerge as a significant independent predictor of accuracy.</p>
<p>One plausible explanation lies in the widespread adoption of data augmentation strategies. Techniques such as image rotation, scaling, contrast adjustment, and noise addition simulate data variability and may reduce the dependency on raw volume. However, excessive use of augmentation may also lead to redundancy or learning saturation, where additional data no longer meaningfully improves generalization.</p>
<p>This interpretation is in line with prior literature. For instance, <xref ref-type="bibr" rid="ref60">Roberts et al. (2021)</xref> found that dataset size was not consistently associated with performance in a comprehensive medical imaging AI studies review. Instead, methodological rigor, validation strategy, and data diversity were identified as stronger predictors of performance. Furthermore, the risk of performance overestimation due to augmented or homogeneous datasets remains a critical concern in model evaluation.</p>
<p><xref ref-type="fig" rid="fig4">Figure 4</xref> presents scatterplots of accuracy, sensitivity, and specificity versus dataset size (&#x2264;5,000), each overlaid with a non-parametric LOWESS regression line and 95% confidence bands. While substantial scatters are observed across all metrics, the absence of clear or consistent directional trends underscores the importance of factors beyond sample size, such as annotation quality and experimental design in developing reliable diagnostic models.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Non-parametric association between dataset size and model performance metrics (&#x2264;5,000 images). Scatter plots depict the relationship between dataset size and three key performance metrics: <bold>(A)</bold> accuracy, <bold>(B)</bold> sensitivity, and <bold>(C)</bold> specificity across studies with &#x2264;5,000 training images. The red lines represent LOWESS (locally weighted scatterplot smoothing) regression fits with 95% confidence bands. Although minor local variations are observed, no clear or systematic trend indicates a significant improvement in these performance metrics with increasing dataset size within the clinically relevant range analyzed. This finding suggests that methodological factors other than dataset size may have a greater influence on diagnostic model accuracy.</p>
</caption>
<graphic xlink:href="frai-08-1649746-g004.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Three scatter plots labeled A, B, and C show accuracy, sensitivity, and specificity versus dataset size, respectively, for sizes up to 5000. Orange dots represent data points, with red lines indicating trends. Plot A shows accuracy stabilizing after increasing. Plot B shows sensitivity slightly fluctuating but generally increasing. Plot C shows specificity peaking and then declining.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec23">
<label>3.3</label>
<title>Comparison between automatic and manual segmentation</title>
<p>To evaluate the impact of segmentation strategy on the diagnostic performance of AI models, performance metrics were compared between studies that implemented automatic segmentation (<italic>n</italic>&#x202F;=&#x202F;27) and those that used manual segmentation (<italic>n</italic>&#x202F;=&#x202F;17).</p>
<p>Models using automatic segmentation achieved a significantly higher average accuracy (94.2%&#x202F;&#x00B1;&#x202F;4.3) than manual segmentation (88.2%&#x202F;&#x00B1;&#x202F;6.6, <italic>p</italic>&#x202F;=&#x202F;0.012). Sensitivity also favored automatic segmentation (93.7%&#x202F;&#x00B1;&#x202F;5.6 vs. 88.6%&#x202F;&#x00B1;&#x202F;8.3, <italic>p</italic>&#x202F;=&#x202F;0.042). Although specificity was higher in the automatic group (92.5%&#x202F;&#x00B1;&#x202F;6.0 vs. 87.3%&#x202F;&#x00B1;&#x202F;9.5), the difference was not statistically significant (<italic>p</italic>&#x202F;=&#x202F;0.084). AUC values were nearly identical between both groups (<italic>p</italic>&#x202F;=&#x202F;0.839). Confidence intervals for these comparisons were not reported but are recommended for future studies to enhance the interpretability and reproducibility of statistical estimates.</p>
<p>Levene&#x2019;s test revealed a significantly more significant variance in specificity within the manual segmentation group (<italic>p</italic>&#x202F;=&#x202F;0.045), indicating less consistency. This is consistent with previous literature findings, highlighting manual segmentation&#x2019;s susceptibility to inter- and intra-observer variability, particularly when standardized annotation protocols or multiple expert raters are not employed (<xref ref-type="bibr" rid="ref70">Taha and Hanbury, 2015</xref>; <xref ref-type="bibr" rid="ref46">Menze et al., 2015</xref>).</p>
<p>Although the primary studies reported heterogeneous segmentation details that precluded a stratified meta-analysis by architecture, a brief practical comparison is informative for clinical implementation. U-Net remains the canonical encoder&#x2013;decoder with skip connections that performs well when lesion boundaries are reasonably defined, and training data are limited. AdaResU-Net augments U-Net with residual blocks and adaptive mechanisms that enlarge the effective receptive field and stabilize gradient flow, improving boundary delineation in speckle-rich ultrasound and in the presence of heterogeneous echotexture. In practice, U-Net offers simplicity and fast deployment; AdaResU-Net can yield crisper contours and fewer leakage errors near cyst walls at the cost of extra parameters. These architectural tradeoffs are likely to contribute to the higher and less variable accuracy we observed with automated vs. manual segmentation. Future primary studies should report standardized segmentation metrics (e.g., Dice, surface distance) alongside classification endpoints to enable formal architecture-level synthesis.</p>
<p><xref ref-type="fig" rid="fig5">Figure 5</xref> presents comparative boxplots of accuracy, sensitivity, specificity, and AUC by segmentation type. The distributions reveal higher mean values for automatic segmentation across most metrics, lower dispersion, and fewer outliers, especially for specificity and sensitivity. This visual trend suggests increased consistency, which may be attributed to the standardization benefits of automated pipelines.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Diagnostic performance metrics stratified by segmentation type (automatic vs. manual). Boxplots illustrate the distribution of <bold>(A)</bold> accuracy, <bold>(B)</bold> sensitivity, <bold>(C)</bold> specificity, and <bold>(D)</bold> AUC across studies using either automatic or manual segmentation. Automatic segmentation models demonstrate higher mean values and reduced dispersion for most metrics, particularly accuracy and specificity. The manual segmentation group shows greater variability and outliers, suggesting less consistency. These visual differences align with the hypothesis that automated segmentation enhances reproducibility and standardization; however, causal interpretation should be made cautiously due to potential confounding factors.</p>
</caption>
<graphic xlink:href="frai-08-1649746-g005.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Box plots comparing automatic and manual methods across four metrics: (A) Accuracy, (B) Sensitivity, (C) Specificity, and (D) AUC. Automatic methods show higher median values in all metrics, with narrower interquartile ranges compared to manual methods. Outliers are present for the sensitivity and specificity metrics.</alt-text>
</graphic>
</fig>
<p><xref ref-type="table" rid="tab4">Table 4</xref> provides a detailed summary of methodological characteristics and performance metrics stratified by segmentation type. Studies using automatic segmentation not only performed better on average but also used considerably larger datasets (mean&#x202F;=&#x202F;22,941 vs. 1,121 images) and demonstrated lower standard deviation across metrics such as accuracy (4% vs. 7%) and specificity (6% vs. 10%).</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Dataset size and performance by segmentation type.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Segmentation</th>
<th align="center" valign="top">Size of dataset (mean)</th>
<th align="center" valign="top">Size of dataset (std)</th>
<th align="center" valign="top">Accuracy (mean)</th>
<th align="center" valign="top">Accuracy (std)</th>
<th align="center" valign="top">Sensitivity (mean)</th>
<th align="center" valign="top">Sensitivity (std)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Automatic</td>
<td align="center" valign="top">22940.63</td>
<td align="center" valign="top">110529.7</td>
<td align="center" valign="top">0.94</td>
<td align="center" valign="top">0.04</td>
<td align="center" valign="top">0.94</td>
<td align="center" valign="top">0.06</td>
</tr>
<tr>
<td align="left" valign="top">Manual</td>
<td align="center" valign="top">1121.35</td>
<td align="center" valign="top">1818.76</td>
<td align="center" valign="top">0.88</td>
<td align="center" valign="top">0.07</td>
<td align="center" valign="top">0.89</td>
<td align="center" valign="top">0.08</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>However, this interpretation should be approached with caution. Although these group-level comparisons suggest superior performance with automatic segmentation, the analysis did not control for potential confounders such as dataset size, model architecture, training methodology, or publication year. Importantly, these variables may co-vary with segmentation strategy, particularly since automatic methods are more prevalent in recent, technically advanced studies.</p>
<p>As shown in the meta-regression (Section 3.4), the segmentation strategy remained a significant independent predictor of accuracy even after adjusting for these covariates. Nevertheless, the unadjusted differences observed here might still reflect broader methodological convergence rather than a causal advantage of automatic segmentation per se.</p>
<p>Future studies should incorporate multivariable models, harmonized annotation protocols, and prospective designs to clarify the segmentation method&#x2019;s isolated effect on AI model performance. Moreover, reporting standards such as STARD-AI and TRIPOD-AI should be adopted to ensure replicability and transparency in performance evaluation across studies (<xref ref-type="bibr" rid="ref15">Collins et al., 2021</xref>; <xref ref-type="bibr" rid="ref68">Sounderajah et al., 2021</xref>).</p>
</sec>
<sec id="sec24">
<label>3.4</label>
<title>Meta-regression analysis of methodological factors</title>
<p>To further explore the drivers of diagnostic performance, a meta-regression was performed using accuracy as the dependent variable and four predictors: dataset size, segmentation strategy (automatic vs. manual), model architecture (CNN vs. other), and risk of bias (high vs. low). The regression model included 26 studies with complete data across all variables (<xref ref-type="fig" rid="fig6">Figure 6</xref>).</p>
<fig position="float" id="fig6">
<label>Figure 6</label>
<caption>
<p>Meta-regression coefficients with 95% confidence intervals. This figure presents the coefficients resulting from the meta-regression analysis evaluating the relative influence of various methodological factors on diagnostic accuracy. Only automatic segmentation demonstrated a statistically significant effect on accuracy (<italic>p</italic>&#x202F;=&#x202F;0.007), whereas other factors such as dataset size, architecture type (CNN vs. others), and risk of bias did not reach statistical significance. This outcome emphasizes the critical importance of automated segmentation quality as a key determinant of AI model performance.</p>
</caption>
<graphic xlink:href="frai-08-1649746-g006.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Bar chart showing the effect on accuracy by different predictors. Segmentation_binary has the highest positive effect, followed by Bias_HighRisk and Architecture_CNN. The size of the dataset shows no effect.</alt-text>
</graphic>
</fig>
<p>The overall model was statistically significant (<italic>F</italic>&#x202F;=&#x202F;3.98, <italic>p</italic>&#x202F;=&#x202F;0.015), with an adjusted <italic>R</italic><sup>2</sup> of 0.32, indicating that the included predictors could explain approximately 32% of the variance in reported accuracy.</p>
<p>Among the covariates, segmentation strategy emerged as a significant predictor: studies using automatic segmentation reported on average, a 6.6 percentage point higher accuracy compared to those using manual segmentation (<italic>&#x03B2;</italic>&#x202F;=&#x202F;0.0656, <italic>p</italic>&#x202F;=&#x202F;0.007). This aligns with previous findings suggesting that automated preprocessing may reduce inter-observer variability and improve reproducibility.</p>
<p>Other predictors, such as dataset size, CNN architecture, and risk of bias, were not statistically significant at the conventional threshold (<italic>p</italic>&#x202F;&#x003E;&#x202F;0.050). However, the effect of high risk of bias approached significance (<italic>&#x03B2;</italic>&#x202F;=&#x202F;0.0427, <italic>p</italic>&#x202F;=&#x202F;0.096), suggesting a possible inflation of performance estimates in studies with methodological limitations.</p>
<p>Notably, dataset size was not a significant predictor (<italic>p</italic>&#x202F;=&#x202F;0.323), corroborating earlier findings that performance does not linearly scale with sample size within the studied range, possibly due to saturation effects or compensatory use of data augmentation techniques.</p>
<p>These results reinforce the critical role of segmentation quality in shaping model performance and highlight the need for more standardized methodologies and transparent reporting in AI-based diagnostic research.</p>
</sec>
<sec id="sec25">
<label>3.5</label>
<title>Temporal analysis</title>
<p>The progression of AI architectures in the included studies reflects a clear methodological shift over time. Temporal analysis of architectural usage revealed a transition from traditional ML techniques and ANNs to DL approaches, particularly CNNs. Between 2014 and 2018, studies primarily employed ML methods such as support vector machines (SVM), random forests (RF), and logistic regression (LR), representing approximately 85% of the methodologies used during this period. ANN-type architecture was also present, constituting roughly 15% of studies, while no CNN-based models were recorded before 2020.</p>
<p><xref ref-type="fig" rid="fig7">Figure 7</xref> presents a stacked bar chart showing the number of studies using each architecture per year. CNNs emerged in 2020, accounting for 20% of the methodologies that year, and showed a marked increase in 2021, becoming the predominant architecture (65% of studies) in 2022. This trend intensified through 2023 (72% of studies) and 2024 (78% of studies), with CNNs accounting for more than half of the models evaluated annually. Transformer-based architectures, specifically Swin Transformer and Pyramid Vision Transformer, appeared exclusively in 2024, accounting for approximately 10% of the methodologies that year, indicating the beginning of a new phase of exploration focused on models with advanced contextual attention mechanisms and long-range feature integration.</p>
<fig position="float" id="fig7">
<label>Figure 7</label>
<caption>
<p>This figure illustrates the temporal evolution in the use of different AI architectures from 2014 to 2024. A clear shift is observed from classical machine learning techniques (ML and ANN) to deep learning models (CNN), particularly from 2021 onwards, with transformer-based models appearing more recently (2024). This evolution reflects a continuous methodological transition toward increasingly sophisticated architectures capable of directly and deeply extracting information from images. However, this shift may also coincide with general methodological improvements over time.</p>
</caption>
<graphic xlink:href="frai-08-1649746-g007.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Stacked bar chart showing the number of AI studies published from 2014 to 2024, with categories for AI architectures: ANN, CNN, FDA, ML, RNN, and TBN. Notable increase in 2024.</alt-text>
</graphic>
</fig>
<p>This shift mirrors broader trends observed across diagnostic imaging AI, where deep architectures have largely replaced classical ML techniques due to their ability to learn hierarchical features directly from raw images without manual feature engineering (<xref ref-type="bibr" rid="ref38">Litjens et al., 2017</xref>; <xref ref-type="bibr" rid="ref20">Esteva et al., 2019</xref>). However, this evolution may also explain some of the performance differences observed in earlier sections. For example, the predominance of CNNs in recent years may co-occur with advances in preprocessing, data augmentation, and training infrastructure, confounding the interpretation of architecture-based performance gains.</p>
<p>Notably, this trend may influence perceived model superiority, as CNN-based studies often reflect newer methodological standards, including automatic segmentation and more rigorous evaluation protocols. These temporal patterns underscore the importance of accounting for publication year and technological maturity when comparing performance across architectures or studies.</p>
</sec>
<sec id="sec26">
<label>3.6</label>
<title>Heterogeneity and risk of bias analysis</title>
<p>To evaluate how methodological quality influences the reported performance of AI models, the 44 included studies were classified according to their overall risk of bias using the PROBAST tool. In total, 26 studies were classified as low risk of bias, 12 as unclear risk, and six as high risk (<xref ref-type="fig" rid="fig8">Figure 8</xref>). However, not all studies reported all performance metrics, and the number of studies included varied substantially by metric. This heterogeneity in reporting introduces selection bias and impairs comparability.</p>
<fig position="float" id="fig8">
<label>Figure 8</label>
<caption>
<p>Distribution of risk of bias across PROBAST domains and associated model performance metrics. <bold>(A)</bold> Distribution of the 44 included studies across the four PROBAST domains (participants, predictors, outcomes, and analysis), categorized by overall risk of bias (low, unclear, and high). <bold>(B)</bold> Mean values of accuracy, sensitivity, specificity, and AUC, stratified by overall risk of bias. Studies classified as high risk consistently report higher mean values for accuracy, sensitivity, and specificity but exhibit greater variability and frequently lack AUC reporting, indicating potential methodological overfitting. Studies with low risk exhibit more consistent and reliable performance metrics.</p>
</caption>
<graphic xlink:href="frai-08-1649746-g008.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Chart A displays the number of studies across different PROBAST domains with risk levels: low (green), unclear (yellow), and high (red). Chart B shows mean values for accuracy, sensitivity, specificity, and AUC with the same risk levels. Both charts highlight the distribution and influence of risk levels in study assessments.</alt-text>
</graphic>
</fig>
<p>Studies classified as high risk of bias showed markedly elevated performance metrics, with a mean accuracy of 96.1%&#x202F;&#x00B1;&#x202F;7.6, a sensitivity of 95.4%&#x202F;&#x00B1;&#x202F;7.9, and a specificity of 93.9%&#x202F;&#x00B1;&#x202F;11.7. However, none of these studies reported areas under the curve (AUC) values, precluding the complete evaluation of discriminative performance. Moreover, the elevated standard deviation in specificity suggests potential overfitting, likely arising from methodologically weak practices such as internal validation without cross-validation, small sample sizes, and operator-dependent manual segmentation (<xref ref-type="bibr" rid="ref75">Wolff et al., 2019</xref>; <xref ref-type="bibr" rid="ref15">Collins et al., 2021</xref>). These practices have been consistently linked to inflated model performance in machine learning for medical imaging (<xref ref-type="bibr" rid="ref32">Kelly et al., 2019</xref>).</p>
<p>In contrast, low-risk studies showed more conservative but consistent performance metrics, with lower dispersion and complete reporting of AUC. Specifically, they reported an accuracy of 90.4%&#x202F;&#x00B1;&#x202F;5.2 (<italic>n</italic> =&#x202F;20), a sensitivity of 90.7%&#x202F;&#x00B1;&#x202F;7.0 (<italic>n</italic>&#x202F;=&#x202F;25), a specificity of 89.1%&#x202F;&#x00B1;&#x202F;8.2 (<italic>n</italic>&#x202F;=&#x202F;22), and an AUC of 93.5%&#x202F;&#x00B1;&#x202F;3.9 (<italic>n</italic>&#x202F;=&#x202F;20). While these results appear numerically inferior, the reduced variability and broader metric completeness suggest higher methodological reliability and clinical applicability.</p>
<p>The unclear-risk group, often the result of poor reporting rather than clearly defined methodological shortcomings, yielded intermediate metrics (accuracy: 93.6%&#x202F;&#x00B1;&#x202F;5.0; sensitivity: 91.9%&#x202F;&#x00B1;&#x202F;7.7; specificity: 91.1%&#x202F;&#x00B1;&#x202F;5.4; AUC: 92.2%&#x202F;&#x00B1;&#x202F;4.6). However, the small and variable sample sizes for each metric (e.g., <italic>n</italic>&#x202F;=&#x202F;6 for specificity) compromise interpretability and hinder statistical power.</p>
<p>A sensitivity analysis was conducted excluding high-risk studies, which resulted in a notable reduction in extreme values (e.g., 100% accuracy) and decreased overall dispersion, particularly in specificity. However, this analysis was limited by the lack of formal statistical testing (e.g., ANOVA or Kruskal&#x2013;Wallis) to assess whether differences between groups were statistically significant. Furthermore, no regression adjustment was made for potential confounders such as dataset size or model complexity. These omissions limit the strength of causal inferences between risk of bias and reported model performance.</p>
<p>The primary sources of methodological heterogeneity across studies were identified as follows: (i) reliance on manual, operator-dependent image segmentation; (ii) absence of cross-validation or external validation; (iii) small sample sizes (&#x003C;200 cases); and (iv) lack of standardized metric reporting formats. These deficiencies were most prevalent in high- and unclear-risk studies, consistent with prior evidence from systematic reviews of machine learning in healthcare (<xref ref-type="bibr" rid="ref68">Sounderajah et al., 2021</xref>; <xref ref-type="bibr" rid="ref41">Liu et al., 2019</xref>).</p>
<p>Finally, this section would benefit from including confidence intervals and formal effect size estimates to contextualize differences across bias strata. Without these, claims about &#x201C;superior&#x201D; or &#x201C;more stable&#x201D; performance remain largely descriptive and potentially misleading.</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec27">
<label>4</label>
<title>Discussion</title>
<p>The analyzed studies demonstrate generally high diagnostic performance of AI models for classifying ovarian masses using B-mode TVS. Most studies achieved AUC values ranging from 0.85 to 0.95, with sensitivity and specificity typically above 80% (<xref ref-type="bibr" rid="ref1">Acharya et al., 2018</xref>; <xref ref-type="bibr" rid="ref62">Sadeghi et al., 2024</xref>). However, substantial heterogeneity across studies suggests caution when interpreting pooled performance metrics due to sample size, class balance, and data quality variations.</p>
<p>Automatic segmentation demonstrated statistically significant accuracy and sensitivity superior to manual segmentation, likely due to reduced observer variability (<italic>p</italic>&#x202F;=&#x202F;0.007 and <italic>p</italic>&#x202F;=&#x202F;0.042, respectively). Although manual segmentation provides potentially optimal delineation by experts, it is prone to operator-dependent biases. Automatic segmentation offers reproducibility and scalability but introduces errors if segmentation quality is suboptimal (<xref ref-type="bibr" rid="ref13">Chiappa et al., 2021</xref>). Given these findings, future research should explicitly compare different segmentation algorithms and validate them against expert delineation standards to enhance clinical applicability.</p>
<p>Contrary to expectations, dataset size alone showed no clear correlation with diagnostic performance within datasets &#x2264;5,000 images. Small datasets sometimes reported exceptional accuracy, likely due to extensive data augmentation strategies, while larger datasets faced increased variability and complexity, offsetting potential accuracy gains (<xref ref-type="bibr" rid="ref1">Acharya et al., 2018</xref>; <xref ref-type="bibr" rid="ref41">Liu et al., 2019</xref>). Thus, methodological rigor, dataset diversity, and validation strategy appear more influential than dataset volume alone.</p>
<p>Comparison among model architectures (classical ML, CNNs, and Transformers) revealed no consistent superiority. Traditional ML models and simple neural networks occasionally matched the performance of sophisticated CNNs and Transformers (<xref ref-type="bibr" rid="ref1">Acharya et al., 2018</xref>). Although CNN-based models showed visually higher median accuracy and reduced variance, no statistically significant differences were observed across architectures (<italic>p</italic>&#x202F;=&#x202F;0.258). Superior results often correlated with modern methodological standards rather than architectural innovation alone. Future research should directly compare these architectures under standardized experimental conditions to clarify intrinsic performance differences clearly.</p>
<p>The risk of bias significantly affected the result&#x2019;s validity. Studies with high or unclear bias frequently reported inflated performance metrics with notable dispersion (e.g., specificity SD&#x202F;=&#x202F;11.7%) due to methodological weaknesses like internal-only validation, small sample sizes, and lack of external validation (<xref ref-type="bibr" rid="ref68">Sounderajah et al., 2021</xref>; <xref ref-type="bibr" rid="ref60">Roberts et al., 2021</xref>). Such biases undermine clinical generalizability, emphasizing the need for rigorous validation standards (e.g., TRIPOD-AI, STARD-AI) and multicenter, prospective validation.</p>
<p>Temporal analysis showed methodological evolution influencing perceived performance gains. Despite less sophisticated techniques, earlier studies occasionally reported superior outcomes due to less rigorous validation methods, whereas recent studies employed stricter evaluation, tempering observed performance improvements (<xref ref-type="bibr" rid="ref68">Sounderajah et al., 2021</xref>; <xref ref-type="bibr" rid="ref60">Roberts et al., 2021</xref>). Therefore, performance comparisons across time should account for these evolving methodological contexts.</p>
<p>Recent advances emphasize the critical importance of precise methodological design and targeted biological understanding. For instance, <xref ref-type="bibr" rid="ref42">Liu et al. (2024)</xref> highlighted how epitope-specific targeting of HER2 significantly influences therapeutic outcomes in solid tumors, illustrating the necessity of methodological precision in clinical efficacy. Similarly, <xref ref-type="bibr" rid="ref43">Ma et al. (2023)</xref> underscored the potential benefits of integrating detailed molecular insights into advanced diagnostics by showing how the glycolytic enzyme ENO1 modulates choline phospholipid metabolism and tumor proliferation. Such multidisciplinary integration may substantially improve cancer characterization and patient outcomes.</p>
<p>AI currently demonstrates potential as an adjunctive diagnostic tool rather than a standalone solution. Real-world applicability requires rigorous external validations, standardized metric reporting (e.g., sensitivity, specificity, predictive values), and integration within clinical workflows. Moreover, evaluating the clinical impact of AI, particularly for distinguishing borderline ovarian lesions, remains essential due to their clinical complexity and diagnostic challenges (<xref ref-type="bibr" rid="ref60">Roberts et al., 2021</xref>).</p>
<p>Given the limited reporting of comprehensive metrics like AUC and F1-score, future studies should ensure the consistent inclusion of these metrics to improve clinical interpretability and decision-making.</p>
<p>In conclusion, while AI models for ovarian mass classification via TVS demonstrate promising diagnostic accuracy, significant methodological limitations currently restrict their clinical translation. Future research must prioritize external validation, robust methodological standards, multidisciplinary integration, and transparent, standardized reporting. Prospective, multicenter studies remain crucial to fully validate these models&#x2019; clinical utility, generalizability, and real-world applicability.</p>
</sec>
<sec sec-type="conclusions" id="sec28">
<label>5</label>
<title>Conclusion</title>
<p>AI models applied to B-mode TVS images demonstrate strong diagnostic performance for classifying ovarian masses, achieving high sensitivity, specificity, and overall discriminative ability (AUC). Automated segmentation significantly outperformed manual methods in accuracy and sensitivity, likely due to enhanced standardization and reduced inter-observer variability.</p>
<p>Nevertheless, these findings must be interpreted cautiously due to considerable methodological heterogeneity, variations in dataset size and quality, and significant risks of bias identified among several studies. Additionally, no consistent superiority emerged among different AI architectures (CNNs, classical ML, or Transformers), suggesting that methodological rigor, validation procedures, and data standardization may be more influential determinants of performance than the specific model architecture itself.</p>
<p>Future research should prioritize prospective, multicenter external validation under realistic clinical conditions for reliable clinical translation. Moreover, rigorous adherence to standardized reporting guidelines (e.g., TRIPOD-AI, STARD-AI), comprehensive metric reporting, including sensitivity, specificity, AUC, and F1-score, and explicit evaluation of clinical utility, especially in distinguishing borderline ovarian lesions, are essential.</p>
<p>In summary, while AI holds significant promise for OC diagnosis using TVS, overcoming current methodological limitations through robust validation and standardized methodological practices is imperative for successful integration into clinical practice.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec29">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref rid="SM1" ref-type="supplementary-material">Supplementary material</xref>, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="sec30">
<title>Author contributions</title>
<p>IG-A: Formal analysis, Data curation, Writing &#x2013; original draft, Conceptualization, Investigation, Writing &#x2013; review &#x0026; editing, Methodology. FV-F: Formal analysis, Writing &#x2013; review &#x0026; editing, Methodology, Funding acquisition, Writing &#x2013; original draft. EB: Methodology, Writing &#x2013; review &#x0026; editing, Investigation, Conceptualization, Formal analysis. JS-V: Investigation, Writing &#x2013; review &#x0026; editing, Methodology, Conceptualization. JM-M: Conceptualization, Methodology, Investigation, Writing &#x2013; review &#x0026; editing. AB-C: Writing &#x2013; review &#x0026; editing, Methodology, Conceptualization, Investigation, Funding acquisition.</p>
</sec>
<sec sec-type="funding-information" id="sec31">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work was supported by the Program for Mobility, Cooperation, and Internationalization &#x2018;&#x2018;Jim&#x00E9;nez de la Espada&#x2019;&#x2019; under Grant 22466/EE/24 of Andr&#x00E9;s Bueno-Crespo funded by the Seneca Foundation &#x2013; Agency for Science and Technology in the Region of Murcia.</p>
</sec>
<sec sec-type="COI-statement" id="sec32">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec33">
<title>Generative AI statement</title>
<p>The authors declare that Gen AI was used in the creation of this manuscript. During the preparation of this manuscript, the authors used ChatGPT to enhance language and readability. After employing this tool, the authors reviewed and edited the content as necessary and assume full responsibility for the content of the publication.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec34">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec35">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/frai.2025.1649746/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/frai.2025.1649746/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Acharya</surname><given-names>U. R.</given-names></name> <name><surname>Akter</surname><given-names>A.</given-names></name> <name><surname>Chowriappa</surname><given-names>P.</given-names></name> <name><surname>Dua</surname><given-names>S.</given-names></name> <name><surname>Raghavendra</surname><given-names>U.</given-names></name> <name><surname>Koh</surname><given-names>J. E. W.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Use of nonlinear features for automated characterization of suspicious ovarian tumors using ultrasound images in fuzzy forest framework</article-title>. <source>Int. J. Fuzzy Syst.</source> <volume>20</volume>, <fpage>1385</fpage>&#x2013;<lpage>1402</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s40815-018-0456-9</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Acharya</surname><given-names>U. R.</given-names></name> <name><surname>Mookiah</surname><given-names>M. R. K.</given-names></name> <name><surname>Vinitha Sree</surname><given-names>S.</given-names></name> <name><surname>Yanti</surname><given-names>R.</given-names></name> <name><surname>Martis</surname><given-names>R. J.</given-names></name> <name><surname>Saba</surname><given-names>L.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Evolutionary algorithm-based classifier parameter tuning for automatic ovarian cancer tissue characterization and classification</article-title>. <source>Ultraschall Med.</source> <volume>35</volume>, <fpage>237</fpage>&#x2013;<lpage>245</lpage>. doi: <pub-id pub-id-type="doi">10.1055/s-0032-1330336</pub-id>, PMID: <pub-id pub-id-type="pmid">23258769</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Acharya</surname><given-names>U. R.</given-names></name> <name><surname>Sree</surname><given-names>S. V.</given-names></name> <name><surname>Kulshreshtha</surname><given-names>S.</given-names></name> <name><surname>Molinari</surname><given-names>F.</given-names></name> <name><surname>Koh</surname><given-names>J. E. W.</given-names></name> <name><surname>Saba</surname><given-names>L.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>GyneScan: an improved online paradigm for screening of ovarian Cancer via tissue characterization</article-title>. <source>Technol. Cancer Res. Treat.</source> <volume>13</volume>, <fpage>529</fpage>&#x2013;<lpage>539</lpage>. doi: <pub-id pub-id-type="doi">10.7785/tcrtexpress.2013.600273</pub-id>, PMID: <pub-id pub-id-type="pmid">24325128</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Akazawa</surname><given-names>M.</given-names></name> <name><surname>Hashimoto</surname><given-names>K.</given-names></name></person-group> (<year>2021</year>). <article-title>Artificial intelligence in gynecologic cancers: current status and future challenges &#x2013; a systematic review</article-title>. <source>Artif. Intell. Med.</source> <volume>120</volume>:<fpage>102164</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.artmed.2021.102164</pub-id>, PMID: <pub-id pub-id-type="pmid">34629152</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Al-karawi</surname><given-names>D.</given-names></name> <name><surname>Al-Assam</surname><given-names>H.</given-names></name> <name><surname>Du</surname><given-names>H.</given-names></name> <name><surname>Sayasneh</surname><given-names>A.</given-names></name> <name><surname>Landolfo</surname><given-names>C.</given-names></name> <name><surname>Timmerman</surname><given-names>D.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>An evaluation of the effectiveness of image-based texture features extracted from static B-mode ultrasound images in distinguishing between benign and malignant ovarian masses</article-title>. <source>Ultrason. Imaging</source> <volume>43</volume>, <fpage>124</fpage>&#x2013;<lpage>138</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0161734621998091</pub-id>, PMID: <pub-id pub-id-type="pmid">33629652</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alwan</surname><given-names>O. F.</given-names></name> <name><surname>Kadhim</surname><given-names>Q. K.</given-names></name> <name><surname>Issa</surname><given-names>R. B.</given-names></name> <name><surname>Ahmed</surname><given-names>S. T.</given-names></name></person-group> (<year>2023</year>). <article-title>Early detection and segmentation of ovarian tumor using convolutional neural network with ultrasound imaging</article-title>. <source>Rev. Intell. Artif.</source> <volume>37</volume>, <fpage>1503</fpage>&#x2013;<lpage>1509</lpage>. doi: <pub-id pub-id-type="doi">10.18280/ria.370614</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aramend&#x00ED;a-Vidaurreta</surname><given-names>V.</given-names></name> <name><surname>Cabeza</surname><given-names>R.</given-names></name> <name><surname>Villanueva</surname><given-names>A.</given-names></name> <name><surname>Navallas</surname><given-names>J.</given-names></name> <name><surname>Alc&#x00E1;zar</surname><given-names>J. L.</given-names></name></person-group> (<year>2015</year>). <article-title>Ultrasound image discrimination between benign and malignant adnexal masses based on a neural network approach</article-title>. <source>Ultrasound Med. Biol.</source> <volume>42</volume>, <fpage>742</fpage>&#x2013;<lpage>752</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ultrasmedbio.2015.11.014</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Badgwell</surname><given-names>D.</given-names></name> <name><surname>Bast</surname><given-names>R. C.</given-names></name></person-group> (<year>2007</year>). <article-title>Early detection of ovarian cancer</article-title>. <source>Dis. Markers</source> <volume>23</volume>, <fpage>397</fpage>&#x2013;<lpage>410</lpage>. doi: <pub-id pub-id-type="doi">10.1155/2007/309382</pub-id>, PMID: <pub-id pub-id-type="pmid">18057523</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bast</surname><given-names>R. C.</given-names></name> <name><surname>Brewer</surname><given-names>M.</given-names></name> <name><surname>Zou</surname><given-names>C.</given-names></name> <name><surname>Hernandez</surname><given-names>M. A.</given-names></name> <name><surname>Daley</surname><given-names>M.</given-names></name> <name><surname>Ozols</surname><given-names>R.</given-names></name> <etal/></person-group>. (<year>2007</year>). <article-title>Prevention and early detection of ovarian cancer: mission impossible?</article-title> <source>Recent Results Cancer Res.</source> <volume>174</volume>, <fpage>91</fpage>&#x2013;<lpage>100</lpage>. doi: <pub-id pub-id-type="doi">10.1007/978-3-540-37696-5_9</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>B&#x00E4;umler</surname><given-names>M.</given-names></name> <name><surname>Gallant</surname><given-names>D.</given-names></name> <name><surname>Druckmann</surname><given-names>R.</given-names></name> <name><surname>Kuhn</surname><given-names>W.</given-names></name></person-group> (<year>2020</year>). <article-title>Ultrasound screening of ovarian cancer</article-title>. <source>Horm. Mol. Biol. Clin. Invest.</source> <volume>41</volume>:<fpage>20190022</fpage>. doi: <pub-id pub-id-type="doi">10.1515/hmbci-2019-0022</pub-id>, PMID: <pub-id pub-id-type="pmid">31661436</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bowtell</surname><given-names>D.</given-names></name> <name><surname>B&#x00F6;hm</surname><given-names>S.</given-names></name> <name><surname>Ahmed</surname><given-names>A.</given-names></name> <name><surname>Aspuria</surname><given-names>P.</given-names></name> <name><surname>Bast</surname><given-names>R.</given-names></name> <name><surname>Beral</surname><given-names>V.</given-names></name></person-group> (<year>2015</year>). <article-title>Rethinking ovarian cancer part II: reducing mortality from high-grade serous ovarian cancer</article-title>. <source>Nat. Rev. Cancer</source> <volume>15</volume>, <fpage>668</fpage>&#x2013;<lpage>679</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nrc4019</pub-id>, PMID: <pub-id pub-id-type="pmid">26493647</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>H.</given-names></name> <name><surname>Yang</surname><given-names>B.-W.</given-names></name> <name><surname>Qian</surname><given-names>L.</given-names></name> <name><surname>Meng</surname><given-names>Y.-S.</given-names></name> <name><surname>Bai</surname><given-names>X.-H.</given-names></name> <name><surname>Hong</surname><given-names>X.-W.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Deep learning prediction of ovarian malignancy at US compared with O-RADS and expert assessment</article-title>. <source>Radiology</source> <volume>304</volume>, <fpage>106</fpage>&#x2013;<lpage>113</lpage>. doi: <pub-id pub-id-type="doi">10.1148/radiol.211367</pub-id>, PMID: <pub-id pub-id-type="pmid">35412367</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chiappa</surname><given-names>V.</given-names></name> <name><surname>Bogani</surname><given-names>G.</given-names></name> <name><surname>Interlenghi</surname><given-names>M.</given-names></name> <name><surname>Salvatore</surname><given-names>C.</given-names></name> <name><surname>Bertolina</surname><given-names>F.</given-names></name> <name><surname>Sarpietro</surname><given-names>G.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>The adoption of radiomics and machine learning improves the diagnostic processes of women with ovarian masses (the AROMA pilot study)</article-title>. <source>J. Ultrasound</source> <volume>24</volume>, <fpage>429</fpage>&#x2013;<lpage>437</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s40477-020-00503-5</pub-id>, PMID: <pub-id pub-id-type="pmid">32696414</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Christiansen</surname><given-names>F.</given-names></name> <name><surname>Epstein</surname><given-names>E.</given-names></name> <name><surname>Smedberg</surname><given-names>E.</given-names></name> <name><surname>&#x00C5;kerlund</surname><given-names>M.</given-names></name> <name><surname>Smith</surname><given-names>K.</given-names></name> <name><surname>Epstein</surname><given-names>E.</given-names></name></person-group> (<year>2021</year>). <article-title>Ultrasound image analysis using deep neural networks for discriminating between benign and malignant ovarian tumors: comparison with expert subjective assessment</article-title>. <source>Ultrasound Obstet. Gynecol.</source> <volume>57</volume>, <fpage>155</fpage>&#x2013;<lpage>163</lpage>. doi: <pub-id pub-id-type="doi">10.1002/uog.23530</pub-id>, PMID: <pub-id pub-id-type="pmid">33142359</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Collins</surname><given-names>G. S.</given-names></name> <name><surname>Dhiman</surname><given-names>P.</given-names></name> <name><surname>Andaur Navarro</surname><given-names>C. L.</given-names></name> <name><surname>Ma</surname><given-names>J.</given-names></name> <name><surname>Hooft</surname><given-names>L.</given-names></name> <name><surname>Reitsma</surname><given-names>J. B.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Protocol for development of a reporting guideline (TRIPOD-AI) and risk of bias tool (PROBAST-AI) for diagnostic and prognostic prediction model studies based on artificial intelligence</article-title>. <source>BMJ Open</source> <volume>11</volume>:<fpage>e048008</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmjopen-2020-048008</pub-id>, PMID: <pub-id pub-id-type="pmid">34244270</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dai</surname><given-names>W.-L.</given-names></name> <name><surname>Wu</surname><given-names>Y.-N.</given-names></name> <name><surname>Ling</surname><given-names>Y.-T.</given-names></name> <name><surname>Zhao</surname><given-names>J.</given-names></name> <name><surname>Zhang</surname><given-names>S.</given-names></name> <name><surname>Gu</surname><given-names>Z.-W.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Development and validation of a deep learning pipeline to diagnose ovarian masses using ultrasound screening: a retrospective multicenter study</article-title>. <source>EClinicalMedicine</source> <volume>78</volume>:<fpage>102923</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.eclinm.2024.102923</pub-id>, PMID: <pub-id pub-id-type="pmid">39640935</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dalmartello</surname><given-names>M.</given-names></name> <name><surname>La Vecchia</surname><given-names>C.</given-names></name> <name><surname>Bertuccio</surname><given-names>P.</given-names></name> <name><surname>Boffetta</surname><given-names>P.</given-names></name> <name><surname>Levi</surname><given-names>F.</given-names></name> <name><surname>Negri</surname><given-names>E.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>European cancer mortality predictions for the year 2022 with focus on ovarian cancer</article-title>. <source>Ann. Oncol. Off. J. Eur. Soc. Med. Oncol.</source> <volume>33</volume>, <fpage>330</fpage>&#x2013;<lpage>339</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.annonc.2021.12.007</pub-id>, PMID: <pub-id pub-id-type="pmid">35090748</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Du</surname><given-names>Y.</given-names></name> <name><surname>Guo</surname><given-names>W.</given-names></name> <name><surname>Xiao</surname><given-names>Y.</given-names></name> <name><surname>Chen</surname><given-names>H.</given-names></name> <name><surname>Yao</surname><given-names>J.</given-names></name> <name><surname>Wu</surname><given-names>J.</given-names></name></person-group> (<year>2024</year>). <article-title>Ultrasound-based deep learning radiomics model for differentiating benign, borderline, and malignant ovarian tumours: a multi-class classification exploratory study</article-title>. <source>BMC Med. Imaging</source> <volume>24</volume>:<fpage>89</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12880-024-01251-2</pub-id>, PMID: <pub-id pub-id-type="pmid">38622546</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Du</surname><given-names>Y.</given-names></name> <name><surname>Xiao</surname><given-names>Y.</given-names></name> <name><surname>Guo</surname><given-names>W.</given-names></name> <name><surname>Yao</surname><given-names>J.</given-names></name> <name><surname>Lan</surname><given-names>T.</given-names></name> <name><surname>Li</surname><given-names>S.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Development and validation of an ultrasound-based deep learning radiomics nomogram for predicting the malignant risk of ovarian tumours</article-title>. <source>Biomed. Eng. Online</source> <volume>23</volume>:<fpage>41</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12938-024-01234-y</pub-id>, PMID: <pub-id pub-id-type="pmid">38594729</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Esteva</surname><given-names>A.</given-names></name> <name><surname>Robicquet</surname><given-names>A.</given-names></name> <name><surname>Ramsundar</surname><given-names>B.</given-names></name> <name><surname>Kuleshov</surname><given-names>V.</given-names></name> <name><surname>DePristo</surname><given-names>M.</given-names></name> <name><surname>Chou</surname><given-names>K.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>A guide to deep learning in healthcare</article-title>. <source>Nat. Med.</source> <volume>25</volume>, <fpage>24</fpage>&#x2013;<lpage>29</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41591-018-0316-z</pub-id>, PMID: <pub-id pub-id-type="pmid">30617335</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Falana</surname><given-names>W. O.</given-names></name> <name><surname>Serener</surname><given-names>A.</given-names></name> <name><surname>Serte</surname><given-names>S.</given-names></name></person-group> (<year>2023</year>). <article-title>Deep learning for comparative study of ovarian cancer detection on histopathological images</article-title>. <source>2023 7th Int. Symp. Multidiscip. Stud. Innov. Technol.</source>, <fpage>1</fpage>&#x2013;<lpage>6</lpage>. doi: <pub-id pub-id-type="doi">10.1109/ISMSIT58785.2023.10304913</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fan</surname><given-names>J.</given-names></name> <name><surname>Liu</surname><given-names>J.</given-names></name> <name><surname>Chen</surname><given-names>Q.</given-names></name> <name><surname>Wang</surname><given-names>W.</given-names></name> <name><surname>Wu</surname><given-names>Y.</given-names></name></person-group> (<year>2023</year>). <article-title>Accurate ovarian cyst classification with a lightweight deep learning model for ultrasound images</article-title>. <source>IEEE Access</source> <volume>11</volume>, <fpage>110681</fpage>&#x2013;<lpage>110691</lpage>. doi: <pub-id pub-id-type="doi">10.1109/ACCESS.2023.3321408</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gao</surname><given-names>Y.</given-names></name> <name><surname>Zeng</surname><given-names>S.</given-names></name> <name><surname>Xu</surname><given-names>X.</given-names></name> <name><surname>Li</surname><given-names>H.</given-names></name> <name><surname>Yao</surname><given-names>S.</given-names></name> <name><surname>Song</surname><given-names>K.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Deep learning-enabled pelvic ultrasound images for accurate diagnosis of ovarian cancer in China: a retrospective, multicentre, diagnostic study</article-title>. <source>Lancet Digit Health</source> <volume>4</volume>, <fpage>e179</fpage>&#x2013;<lpage>e187</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S2589-7500(21)00278-8</pub-id>, PMID: <pub-id pub-id-type="pmid">35216752</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Giourga</surname><given-names>M.</given-names></name> <name><surname>Petropoulos</surname><given-names>I.</given-names></name> <name><surname>Stavros</surname><given-names>S.</given-names></name> <name><surname>Potiris</surname><given-names>A.</given-names></name> <name><surname>Gerede</surname><given-names>A.</given-names></name> <name><surname>Sapantzoglou</surname><given-names>I.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Enhancing ovarian tumor diagnosis: performance of convolutional neural networks in classifying ovarian masses using ultrasound images</article-title>. <source>J. Clin. Med.</source> <volume>13</volume>:<fpage>4123</fpage>. doi: <pub-id pub-id-type="doi">10.3390/jcm13144123</pub-id>, PMID: <pub-id pub-id-type="pmid">39064163</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>He</surname><given-names>X.</given-names></name> <name><surname>Bai</surname><given-names>X.-H.</given-names></name> <name><surname>Chen</surname><given-names>H.</given-names></name> <name><surname>Feng</surname><given-names>W.-W.</given-names></name></person-group> (<year>2024</year>). <article-title>Machine learning models in evaluating the malignancy risk of ovarian tumors: a comparative study</article-title>. <source>J. Ovarian Res.</source> <volume>17</volume>:<fpage>219</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13048-024-01544-8</pub-id>, PMID: <pub-id pub-id-type="pmid">39506832</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Heinlein</surname><given-names>L.</given-names></name> <name><surname>Maron</surname><given-names>R. C.</given-names></name> <name><surname>Hekler</surname><given-names>A.</given-names></name> <name><surname>Haggenm&#x00FC;ller</surname><given-names>S.</given-names></name> <name><surname>Wies</surname><given-names>C.</given-names></name> <name><surname>Utikal</surname><given-names>J. S.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Clinical melanoma diagnosis with artificial intelligence: insights from a prospective multicenter study</article-title>. arXiv. [Preprint]. doi: <pub-id pub-id-type="doi">10.48550/arXiv.2401.14193</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Ho</surname><given-names>D. J.</given-names></name> <name><surname>Chui</surname><given-names>M. H.</given-names></name> <name><surname>Vanderbilt</surname><given-names>C. M.</given-names></name> <name><surname>Jung</surname><given-names>J.</given-names></name> <name><surname>Robson</surname><given-names>M. E.</given-names></name> <name><surname>Park</surname><given-names>C.-S.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Deep interactive learning-based ovarian cancer segmentation of H&#x0026;E-stained whole slide images to study morphological patterns of BRCA mutation</article-title>. arXiv. [Preprint]. doi: <pub-id pub-id-type="doi">10.48550/arXiv.2203.15015</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hussein</surname><given-names>I. J.</given-names></name> <name><surname>Burhanuddin</surname><given-names>M. A.</given-names></name> <name><surname>Mohammed</surname><given-names>M. A.</given-names></name> <name><surname>Benameur</surname><given-names>N.</given-names></name> <name><surname>Maashi</surname><given-names>M. S.</given-names></name> <name><surname>Maashi</surname><given-names>M. S.</given-names></name></person-group> (<year>2022</year>). <article-title>Fully-automatic identification of gynaecological abnormality using a new adaptive frequency filter and histogram of oriented gradients (HOG)</article-title>. <source>Expert. Syst.</source> <volume>39</volume>:<fpage>e12789</fpage>. doi: <pub-id pub-id-type="doi">10.1111/exsy.12789</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hussein</surname><given-names>I. J.</given-names></name> <name><surname>Burhanuddin</surname><given-names>M.</given-names></name> <name><surname>Mohammed</surname><given-names>M.</given-names></name> <name><surname>Elhoseny</surname><given-names>M.</given-names></name> <name><surname>Garcia-Zapirain</surname><given-names>B.</given-names></name> <name><surname>Maashi</surname><given-names>M.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Fully automatic segmentation of gynaecological abnormality using a new Viola&#x2013;Jones model</article-title>. <source>Comput. Mater. Contin.</source> <volume>66</volume>, <fpage>3161</fpage>&#x2013;<lpage>3182</lpage>. doi: <pub-id pub-id-type="doi">10.32604/cmc.2021.012691</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jacobs</surname><given-names>L.</given-names></name> <name><surname>Menon</surname><given-names>U.</given-names></name></person-group> (<year>2004</year>). <article-title>Progress and challenges in screening for early detection of ovarian cancer</article-title>. <source>Mol. Cell Proteomics</source> <volume>3</volume>, <fpage>355</fpage>&#x2013;<lpage>366</lpage>. doi: <pub-id pub-id-type="doi">10.1074/mcp.R400006-MCP200</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jeevitha</surname><given-names>S.</given-names></name> <name><surname>Priya</surname><given-names>N.</given-names></name></person-group> (<year>2022</year>). <article-title>Identifying and classifying an ovarian cyst using SCBOD (size and count-based ovarian detection) algorithm in ultrasound image</article-title>. <source>Int. J. Electr. Comp. Eng. Syst.</source> <volume>13</volume>, <fpage>799</fpage>&#x2013;<lpage>806</lpage>. doi: <pub-id pub-id-type="doi">10.32985/ijeces.13.9.8</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kelly</surname><given-names>C. J.</given-names></name> <name><surname>Karthikesalingam</surname><given-names>A.</given-names></name> <name><surname>Suleyman</surname><given-names>M.</given-names></name> <name><surname>Corrado</surname><given-names>G.</given-names></name> <name><surname>King</surname><given-names>D.</given-names></name></person-group> (<year>2019</year>). <article-title>Key challenges for delivering clinical impact with artificial intelligence</article-title>. <source>BMC Med.</source> <volume>17</volume>:<fpage>195</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12916-019-1426-2</pub-id>, PMID: <pub-id pub-id-type="pmid">31665002</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kiruthika</surname><given-names>V.</given-names></name> <name><surname>Sathiya</surname><given-names>S.</given-names></name> <name><surname>Ramya</surname><given-names>M. M.</given-names></name> <name><surname>Sakthidasan Sankaran</surname><given-names>K.</given-names></name></person-group> (<year>2023</year>). <article-title>An intelligent machine learning approach for ovarian detection and classification system using ultrasonogram images</article-title>. <source>Eng. Sci.</source> <volume>23</volume>:<fpage>879</fpage>. doi: <pub-id pub-id-type="doi">10.1201/9781003224068-2</pub-id>, PMID: <pub-id pub-id-type="pmid">41070723</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kongara</surname><given-names>S. R.</given-names></name> <name><surname>Prakasha</surname><given-names>S.</given-names></name> <name><surname>Brindha</surname><given-names>A.</given-names></name> <name><surname>Pathak</surname><given-names>S. K.</given-names></name> <name><surname>Miya</surname><given-names>J.</given-names></name> <name><surname>Taqui</surname><given-names>S. N.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Performance evaluation of optimized convolutional neural network mechanism in the detection and classification of ovarian cancer</article-title>. <source>Multimed. Tools Appl.</source> <volume>83</volume>, <fpage>71311</fpage>&#x2013;<lpage>71334</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11042-024-18115-0</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>J.</given-names></name> <name><surname>Chen</surname><given-names>Y.</given-names></name> <name><surname>Zhang</surname><given-names>M.</given-names></name> <name><surname>Zhang</surname><given-names>P.</given-names></name> <name><surname>He</surname><given-names>K.</given-names></name> <name><surname>Yan</surname><given-names>F.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>A deep learning model system for diagnosis and management of adnexal masses</article-title>. <source>Cancer</source> <volume>14</volume>:<fpage>5291</fpage>. doi: <pub-id pub-id-type="doi">10.3390/cancers14215291</pub-id>, PMID: <pub-id pub-id-type="pmid">36358710</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>L.</given-names></name> <name><surname>He</surname><given-names>L.</given-names></name> <name><surname>Guo</surname><given-names>W.</given-names></name> <name><surname>Ma</surname><given-names>J.</given-names></name> <name><surname>Sun</surname><given-names>G.</given-names></name> <name><surname>Ma</surname><given-names>H.</given-names></name></person-group> (<year>2024</year>). <article-title>PMFFNet: a hybrid network based on feature pyramid for ovarian tumor segmentation</article-title>. <source>PLoS One</source> <volume>19</volume>:<fpage>e0299360</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0299360</pub-id>, PMID: <pub-id pub-id-type="pmid">38557660</pub-id></citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liberati</surname><given-names>A.</given-names></name> <name><surname>Altman</surname><given-names>D. G.</given-names></name> <name><surname>Tetzlaff</surname><given-names>J.</given-names></name> <name><surname>Mulrow</surname><given-names>C.</given-names></name> <name><surname>G&#x00F8;tzsche</surname><given-names>P. C.</given-names></name> <name><surname>Ioannidis</surname><given-names>J. P. A.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>The PRISMA statement for reporting systematic reviews and meta-analyses of studies that evaluate health care interventions: explanation and elaboration</article-title>. <source>J. Clin. Epidemiol.</source> <volume>62</volume>, <fpage>e1</fpage>&#x2013;<lpage>e34</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jclinepi.2009.06.006</pub-id>, PMID: <pub-id pub-id-type="pmid">19631507</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Litjens</surname><given-names>G.</given-names></name> <name><surname>Kooi</surname><given-names>T.</given-names></name> <name><surname>Bejnordi</surname><given-names>B. E.</given-names></name> <name><surname>Setio</surname><given-names>A. A. A.</given-names></name> <name><surname>Ciompi</surname><given-names>F.</given-names></name> <name><surname>Ghafoorian</surname><given-names>M.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>A survey on deep learning in medical image analysis</article-title>. <source>Med. Image Anal.</source> <volume>42</volume>, <fpage>60</fpage>&#x2013;<lpage>88</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.media.2017.07.005</pub-id>, PMID: <pub-id pub-id-type="pmid">28778026</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>L.</given-names></name> <name><surname>Cai</surname><given-names>W.</given-names></name> <name><surname>Tian</surname><given-names>H.</given-names></name> <name><surname>Wu</surname><given-names>B.</given-names></name> <name><surname>Zhang</surname><given-names>J.</given-names></name> <name><surname>Wang</surname><given-names>T.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Ultrasound image-based nomogram combining clinical, radiomics, and deep transfer learning features for automatic classification of ovarian masses according to O-RADS</article-title>. <source>Front. Oncol.</source> <volume>14</volume>:<fpage>1377489</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fonc.2024.1377489</pub-id>, PMID: <pub-id pub-id-type="pmid">38812784</pub-id></citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>L.</given-names></name> <name><surname>Cai</surname><given-names>W.</given-names></name> <name><surname>Zhou</surname><given-names>C.</given-names></name> <name><surname>Tian</surname><given-names>H.</given-names></name> <name><surname>Wu</surname><given-names>B.</given-names></name> <name><surname>Zhang</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Ultrasound radiomics-based artificial intelligence model to assist in the differential diagnosis of ovarian endometrioma and ovarian dermoid cyst</article-title>. <source>Front. Med.</source> <volume>11</volume>:<fpage>11</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fmed.2024.1362588</pub-id>, PMID: <pub-id pub-id-type="pmid">38523908</pub-id></citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>X.</given-names></name> <name><surname>Faes</surname><given-names>L.</given-names></name> <name><surname>Kale</surname><given-names>A. U.</given-names></name> <name><surname>Wagner</surname><given-names>S. K.</given-names></name> <name><surname>Fu</surname><given-names>D. J.</given-names></name> <name><surname>Bruynseels</surname><given-names>A.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>A comparison of deep learning performance against health-care professionals in detecting diseases from medical imaging: a systematic review and meta-analysis</article-title>. <source>Lancet Digit Health</source> <volume>1</volume>, <fpage>e271</fpage>&#x2013;<lpage>e297</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S2589-7500(19)30123-2</pub-id>, PMID: <pub-id pub-id-type="pmid">33323251</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>X.</given-names></name> <name><surname>Song</surname><given-names>Y.</given-names></name> <name><surname>Cheng</surname><given-names>P.</given-names></name> <name><surname>Liang</surname><given-names>B.</given-names></name> <name><surname>Xing</surname><given-names>D.</given-names></name></person-group> (<year>2024</year>). <article-title>Targeting HER2 in solid tumors: unveiling the structure and novel epitopes</article-title>. <source>Cancer Treat. Rev.</source> <volume>130</volume>:<fpage>102826</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ctrv.2024.102826</pub-id>, PMID: <pub-id pub-id-type="pmid">39270365</pub-id></citation></ref>
<ref id="ref43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ma</surname><given-names>Q.</given-names></name> <name><surname>Jiang</surname><given-names>H.</given-names></name> <name><surname>Ma</surname><given-names>L.</given-names></name> <name><surname>Zhao</surname><given-names>G.</given-names></name> <name><surname>Xu</surname><given-names>Q.</given-names></name> <name><surname>Guo</surname><given-names>D.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>The moonlighting function of glycolytic enzyme enolase-1 promotes choline phospholipid metabolism and tumor cell proliferation</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>120</volume>:<fpage>e2209435120</fpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.2209435120</pub-id>, PMID: <pub-id pub-id-type="pmid">37011206</pub-id></citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mart&#x00ED;nez-M&#x00E1;s</surname><given-names>J.</given-names></name> <name><surname>Bueno-Crespo</surname><given-names>A.</given-names></name> <name><surname>Khazendar</surname><given-names>S.</given-names></name> <name><surname>Remezal-Solano</surname><given-names>M.</given-names></name> <name><surname>Mart&#x00ED;nez-Cend&#x00E1;n</surname><given-names>J.-P.</given-names></name> <name><surname>Jassim</surname><given-names>S.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Evaluation of machine learning methods with Fourier transform features for classifying ovarian tumors based on ultrasound images</article-title>. <source>PLoS One</source> <volume>14</volume>:<fpage>e0219388</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0219388</pub-id>, PMID: <pub-id pub-id-type="pmid">31348783</pub-id></citation></ref>
<ref id="ref45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Meijing</surname><given-names>W.</given-names></name> <name><surname>Guangxia</surname><given-names>C.</given-names></name> <name><surname>Shuchang</surname><given-names>L.</given-names></name> <name><surname>Lijiang</surname><given-names>C.</given-names></name> <name><surname>Zongmei</surname><given-names>T.</given-names></name> <name><surname>Min</surname><given-names>Y.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Deep convolutional neural networks for multiple histologic types of ovarian tumors classification in ultrasound images</article-title>. <source>Front. Oncol.</source> <volume>13</volume>:<fpage>1154200</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fonc.2023.1154200</pub-id></citation></ref>
<ref id="ref46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Menze</surname><given-names>B. H.</given-names></name> <name><surname>Jakab</surname><given-names>A.</given-names></name> <name><surname>Bauer</surname><given-names>S.</given-names></name> <name><surname>Kalpathy-Cramer</surname><given-names>J.</given-names></name> <name><surname>Farahani</surname><given-names>K.</given-names></name> <name><surname>Kirby</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>The multimodal brain tumor image segmentation benchmark (BRATS)</article-title>. <source>IEEE Trans. Med. Imaging</source> <volume>34</volume>, <fpage>1993</fpage>&#x2013;<lpage>2024</lpage>. doi: <pub-id pub-id-type="doi">10.1109/TMI.2014.2377694</pub-id>, PMID: <pub-id pub-id-type="pmid">25494501</pub-id></citation></ref>
<ref id="ref47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Miao</surname><given-names>K.</given-names></name> <name><surname>Lv</surname><given-names>Q.</given-names></name> <name><surname>Zhang</surname><given-names>L.</given-names></name> <name><surname>Zhao</surname><given-names>N.</given-names></name> <name><surname>Dong</surname><given-names>X.</given-names></name></person-group> (<year>2024</year>). <article-title>Discriminative diagnosis of ovarian endometriosis cysts and benign mucinous cystadenomas based on the ConvNeXt algorithm</article-title>. <source>Eur. J. Obstet. Gynecol. Reprod. Biol.</source> <volume>298</volume>, <fpage>135</fpage>&#x2013;<lpage>139</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ejogrb.2024.05.010</pub-id>, PMID: <pub-id pub-id-type="pmid">38756053</pub-id></citation></ref>
<ref id="ref48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Miao</surname><given-names>K.</given-names></name> <name><surname>Zhao</surname><given-names>N.</given-names></name> <name><surname>Lv</surname><given-names>Q.</given-names></name> <name><surname>He</surname><given-names>X.</given-names></name> <name><surname>Xu</surname><given-names>M.</given-names></name> <name><surname>Dong</surname><given-names>X.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Prediction of benign and malignant ovarian tumors using Resnet34 on ultrasound images</article-title>. <source>J. Obstet. Gynaecol. Res.</source> <volume>49</volume>, <fpage>2910</fpage>&#x2013;<lpage>2917</lpage>. doi: <pub-id pub-id-type="doi">10.1111/jog.15788</pub-id>, PMID: <pub-id pub-id-type="pmid">37696522</pub-id></citation></ref>
<ref id="ref49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moro</surname><given-names>F.</given-names></name> <name><surname>Vagni</surname><given-names>M.</given-names></name> <name><surname>Tran</surname><given-names>H. E.</given-names></name> <name><surname>Bernardini</surname><given-names>F.</given-names></name> <name><surname>Mascilini</surname><given-names>F.</given-names></name> <name><surname>Ciccarone</surname><given-names>F.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Radiomics analysis of ultrasound images to discriminate between benign and malignant adnexal masses with solid ultrasound morphology</article-title>. <source>Ultrasound Obstet. Gynecol. Off. J. Int. Soc.</source> <volume>65</volume>, <fpage>353</fpage>&#x2013;<lpage>363</lpage>. doi: <pub-id pub-id-type="doi">10.1002/uog.27680</pub-id></citation></ref>
<ref id="ref50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Narmatha</surname><given-names>C.</given-names></name> <name><surname>Manimegalai</surname><given-names>P.</given-names></name> <name><surname>Krishnadass</surname><given-names>J.</given-names></name> <name><surname>Valsalan</surname><given-names>P.</given-names></name> <name><surname>Manimurugan</surname><given-names>S.</given-names></name> <name><surname>Mustafa</surname><given-names>M.</given-names></name></person-group> (<year>2023</year>). <article-title>Ovarian cysts classification using novel deep reinforcement learning with Harris hawks optimization method</article-title>. <source>J. Supercomput.</source> <volume>79</volume>, <fpage>1374</fpage>&#x2013;<lpage>1397</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11227-022-04709-8</pub-id></citation></ref>
<ref id="ref51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nebgen</surname><given-names>D. R.</given-names></name> <name><surname>Lu</surname><given-names>K. H.</given-names></name> <name><surname>Bast</surname><given-names>R. C.</given-names></name></person-group> (<year>2019</year>). <article-title>Novel approaches to ovarian cancer screening</article-title>. <source>Curr. Oncol. Rep.</source> <volume>21</volume>:<fpage>75</fpage>. doi: <pub-id pub-id-type="doi">10.1007/s11912-019-0816-0</pub-id>, PMID: <pub-id pub-id-type="pmid">31346778</pub-id></citation></ref>
<ref id="ref52"><citation citation-type="other"><person-group person-group-type="author"><collab id="coll1">NIH</collab></person-group>. <article-title>Cancer stat facts: ovarian cancer</article-title>. (<year>2020</year>). Available online at: <ext-link xlink:href="https://seer.cancer.gov/statfacts/html/ovary.html" ext-link-type="uri">https://seer.cancer.gov/statfacts/html/ovary.html</ext-link> (Accessed June 10, 2025).</citation></ref>
<ref id="ref53"><citation citation-type="other"><person-group person-group-type="author"><collab id="coll2">NIH</collab></person-group>. <article-title>The cancer imaging archive</article-title>. (<year>n.d.</year>). Available online at: <ext-link xlink:href="https://www.cancerimagingarchive.net/" ext-link-type="uri">https://www.cancerimagingarchive.net/</ext-link> (Accessed June 10, 2025).</citation></ref>
<ref id="ref54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Noseworthy</surname><given-names>P. A.</given-names></name> <name><surname>Attia</surname><given-names>Z. I.</given-names></name> <name><surname>Brewer</surname><given-names>L. C.</given-names></name> <name><surname>Hayes</surname><given-names>S. N.</given-names></name> <name><surname>Yao</surname><given-names>X.</given-names></name> <name><surname>Kapa</surname><given-names>S.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Assessing and mitigating bias in medical artificial intelligence</article-title>. <source>Circ. Arrhythm. Electrophysiol.</source> <volume>13</volume>:<fpage>e007988</fpage>. doi: <pub-id pub-id-type="doi">10.1161/CIRCEP.119.007988</pub-id>, PMID: <pub-id pub-id-type="pmid">32064914</pub-id></citation></ref>
<ref id="ref55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Page</surname><given-names>M. J.</given-names></name> <name><surname>McKenzie</surname><given-names>J. E.</given-names></name> <name><surname>Bossuyt</surname><given-names>P. M.</given-names></name> <name><surname>Boutron</surname><given-names>I.</given-names></name> <name><surname>Hoffmann</surname><given-names>T. C.</given-names></name> <name><surname>Mulrow</surname><given-names>C. D.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title>. <source>BMJ</source> <volume>372</volume>:<fpage>n71</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id></citation></ref>
<ref id="ref56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Patil</surname><given-names>S. D.</given-names></name> <name><surname>Deore</surname><given-names>P. J.</given-names></name> <name><surname>Patil</surname><given-names>V. B.</given-names></name></person-group> (<year>2024</year>). <article-title>An intelligent computer aided diagnosis system for classification of ovarian masses using machine learning approach</article-title>. <source>Int. Res. J. Multidiscip. Technov.</source> <volume>6</volume>, <fpage>45</fpage>&#x2013;<lpage>57</lpage>. doi: <pub-id pub-id-type="doi">10.54392/irjmt2434</pub-id></citation></ref>
<ref id="ref57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pham</surname><given-names>T.-L.</given-names></name> <name><surname>Le</surname><given-names>V.-H.</given-names></name></person-group> (<year>2024</year>). <article-title>Ovarian tumors detection and classification from ultrasound images based on YOLOv8</article-title>. <source>J. Adv. Inf. Technol.</source> <volume>15</volume>, <fpage>264</fpage>&#x2013;<lpage>275</lpage>. doi: <pub-id pub-id-type="doi">10.12720/jait.15.2.264-275</pub-id></citation></ref>
<ref id="ref58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Raciti</surname><given-names>P.</given-names></name> <name><surname>Sue</surname><given-names>J.</given-names></name> <name><surname>Retamero</surname><given-names>J. A.</given-names></name> <name><surname>Ceballos</surname><given-names>R.</given-names></name> <name><surname>Godrich</surname><given-names>R.</given-names></name> <name><surname>Kunz</surname><given-names>J. D.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Clinical validation of artificial intelligence&#x2013;augmented pathology diagnosis demonstrates significant gains in diagnostic accuracy in prostate Cancer detection</article-title>. <source>Arch. Pathol. Lab Med.</source> <volume>147</volume>, <fpage>1178</fpage>&#x2013;<lpage>1185</lpage>. doi: <pub-id pub-id-type="doi">10.5858/arpa.2022-0066-OA</pub-id>, PMID: <pub-id pub-id-type="pmid">36538386</pub-id></citation></ref>
<ref id="ref59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ravishankar</surname><given-names>T. N.</given-names></name> <name><surname>Makarand Jadhav</surname><given-names>H.</given-names></name> <name><surname>Satheesh Kumar</surname><given-names>N.</given-names></name> <name><surname>Ambala</surname><given-names>S.</given-names></name> <name><surname>Pillai</surname><given-names>N. M.</given-names></name></person-group> (<year>2023</year>). <article-title>A deep learning approach for ovarian cysts detection and classification (OCD-FCNN) using fuzzy convolutional neural network</article-title>. <source>Meas. Sens.</source> <volume>27</volume>:<fpage>100797</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.measen.2023.100797</pub-id></citation></ref>
<ref id="ref60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Roberts</surname><given-names>M.</given-names></name> <name><surname>Driggs</surname><given-names>D.</given-names></name> <name><surname>Thorpe</surname><given-names>M.</given-names></name> <name><surname>Gilbey</surname><given-names>J.</given-names></name> <name><surname>Yeung</surname><given-names>M.</given-names></name> <name><surname>Ursprung</surname><given-names>S.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Common pitfalls and recommendations for using machine learning to detect and prognosticate for COVID-19 using chest radiographs and CT scans</article-title>. <source>Nat. Mach. Intell.</source> <volume>3</volume>, <fpage>199</fpage>&#x2013;<lpage>217</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s42256-021-00307-0</pub-id></citation></ref>
<ref id="ref61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rosati</surname><given-names>A.</given-names></name> <name><surname>Gueli Alletti</surname><given-names>S.</given-names></name> <name><surname>Capozzi</surname><given-names>V. A.</given-names></name> <name><surname>Mirandola</surname><given-names>M.</given-names></name> <name><surname>Vargiu</surname><given-names>V.</given-names></name> <name><surname>Fedele</surname><given-names>C.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Role of ultrasound in the detection of recurrent ovarian cancer: a review of the literature</article-title>. <source>Gland Surg.</source> <volume>9</volume>, <fpage>1092</fpage>&#x2013;<lpage>1101</lpage>. doi: <pub-id pub-id-type="doi">10.21037/gs-20-357</pub-id>, PMID: <pub-id pub-id-type="pmid">32953624</pub-id></citation></ref>
<ref id="ref62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sadeghi</surname><given-names>M. H.</given-names></name> <name><surname>Sina</surname><given-names>S.</given-names></name> <name><surname>Omidi</surname><given-names>H.</given-names></name> <name><surname>Farshchitabrizi</surname><given-names>A. H.</given-names></name> <name><surname>Alavi</surname><given-names>M.</given-names></name></person-group> (<year>2024</year>). <article-title>Deep learning in ovarian cancer diagnosis: a comprehensive review of various imaging modalities</article-title>. <source>Pol. J. Radiol.</source> <volume>89</volume>, <fpage>30</fpage>&#x2013;<lpage>48</lpage>. doi: <pub-id pub-id-type="doi">10.5114/pjr.2024.134817</pub-id>, PMID: <pub-id pub-id-type="pmid">38371888</pub-id></citation></ref>
<ref id="ref63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sahu</surname><given-names>S. A.</given-names></name> <name><surname>Shrivastava</surname><given-names>D.</given-names></name></person-group> (<year>2023</year>). <article-title>A comprehensive review of screening methods for ovarian masses: towards earlier detection</article-title>. <source>Cureus</source> <volume>15</volume>:<fpage>e48534</fpage>. doi: <pub-id pub-id-type="doi">10.7759/cureus.48534</pub-id>, PMID: <pub-id pub-id-type="pmid">38084173</pub-id></citation></ref>
<ref id="ref64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sha</surname><given-names>M.</given-names></name></person-group> (<year>2024</year>). <article-title>Segmentation of ovarian cyst in ultrasound images using AdaResU-net with optimization algorithm and deep learning model</article-title>. <source>Sci. Rep.</source> <volume>14</volume>:<fpage>18868</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-024-69427-y</pub-id>, PMID: <pub-id pub-id-type="pmid">39143122</pub-id></citation></ref>
<ref id="ref65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shih-Tien</surname><given-names>H.</given-names></name> <name><surname>Yu-Jie</surname><given-names>S.</given-names></name> <name><surname>Chian-Huei</surname><given-names>H.</given-names></name> <name><surname>Ming-Jer</surname><given-names>C.</given-names></name> <name><surname>Chien-Hsing</surname><given-names>L.</given-names></name> <name><surname>Chih-En</surname><given-names>K.</given-names></name></person-group> (<year>2022</year>). <article-title>Automatic ovarian tumors recognition system based on ensemble convolutional neural network with ultrasound imaging</article-title>. <source>BMC Med. Inform. Decis. Mak.</source> <volume>22</volume>:<fpage>298</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12911-022-02047-6</pub-id></citation></ref>
<ref id="ref66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Siegel</surname><given-names>R. L.</given-names></name> <name><surname>Miller</surname><given-names>K. D.</given-names></name> <name><surname>Fuchs</surname><given-names>H. E.</given-names></name> <name><surname>Jemal</surname><given-names>A.</given-names></name></person-group> (<year>2021</year>). <article-title>Cancer statistics, 2021</article-title>. <source>CA Cancer J. Clin.</source> <volume>71</volume>, <fpage>7</fpage>&#x2013;<lpage>33</lpage>. doi: <pub-id pub-id-type="doi">10.3322/caac.21654</pub-id>, PMID: <pub-id pub-id-type="pmid">33433946</pub-id></citation></ref>
<ref id="ref67"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sone</surname><given-names>K.</given-names></name> <name><surname>Toyohara</surname><given-names>Y.</given-names></name> <name><surname>Taguchi</surname><given-names>A.</given-names></name> <name><surname>Miyamoto</surname><given-names>Y.</given-names></name> <name><surname>Tanikawa</surname><given-names>M.</given-names></name> <name><surname>Uchino-Mori</surname><given-names>M.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Application of artificial intelligence in gynecologic malignancies: a review</article-title>. <source>J. Obstet. Gynaecol. Res.</source> <volume>47</volume>, <fpage>2577</fpage>&#x2013;<lpage>2585</lpage>. doi: <pub-id pub-id-type="doi">10.1111/jog.14818</pub-id>, PMID: <pub-id pub-id-type="pmid">33973305</pub-id></citation></ref>
<ref id="ref68"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sounderajah</surname><given-names>V.</given-names></name> <name><surname>Ashrafian</surname><given-names>H.</given-names></name> <name><surname>Golub</surname><given-names>R. M.</given-names></name> <name><surname>Shetty</surname><given-names>S.</given-names></name> <name><surname>De Fauw</surname><given-names>J.</given-names></name> <name><surname>Hooft</surname><given-names>L.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Developing a reporting guideline for artificial intelligence-centred diagnostic test accuracy studies: the STARD-AI protocol</article-title>. <source>BMJ Open</source> <volume>11</volume>:<fpage>e047709</fpage>. doi: <pub-id pub-id-type="doi">10.1136/bmjopen-2020-047709</pub-id>, PMID: <pub-id pub-id-type="pmid">34183345</pub-id></citation></ref>
<ref id="ref69"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>&#x0218;tefan</surname><given-names>P.-A.</given-names></name> <name><surname>Lupean</surname><given-names>R.-A.</given-names></name> <name><surname>Mihu</surname><given-names>C. M.</given-names></name> <name><surname>Lebovici</surname><given-names>A.</given-names></name> <name><surname>Oancea</surname><given-names>M. D.</given-names></name> <name><surname>Hu</surname><given-names>L.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Ultrasonography in the diagnosis of adnexal lesions: the role of texture analysis</article-title>. <source>Diagnostics</source> <volume>11</volume>:<fpage>812</fpage>. doi: <pub-id pub-id-type="doi">10.3390/diagnostics11050812</pub-id>, PMID: <pub-id pub-id-type="pmid">33947150</pub-id></citation></ref>
<ref id="ref70"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Taha</surname><given-names>A. A.</given-names></name> <name><surname>Hanbury</surname><given-names>A.</given-names></name></person-group> (<year>2015</year>). <article-title>Metrics for evaluating 3D medical image segmentation: analysis, selection, and tool</article-title>. <source>BMC Med. Imaging</source> <volume>15</volume>:<fpage>29</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12880-015-0068-x</pub-id>, PMID: <pub-id pub-id-type="pmid">26263899</pub-id></citation></ref>
<ref id="ref71"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname><given-names>Z.-P.</given-names></name> <name><surname>Ma</surname><given-names>Z.</given-names></name> <name><surname>He</surname><given-names>Y.</given-names></name> <name><surname>Liu</surname><given-names>R.-C.</given-names></name> <name><surname>Jin</surname><given-names>B.-B.</given-names></name> <name><surname>Wen</surname><given-names>D.-Y.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Ultrasound-based radiomics for predicting different pathological subtypes of epithelial ovarian cancer before surgery</article-title>. <source>BMC Med. Imaging</source> <volume>22</volume>:<fpage>147</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12880-022-00879-2</pub-id>, PMID: <pub-id pub-id-type="pmid">35996097</pub-id></citation></ref>
<ref id="ref72"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Torre</surname><given-names>L. A.</given-names></name> <name><surname>Trabert</surname><given-names>B.</given-names></name> <name><surname>DeSantis</surname><given-names>C. E.</given-names></name> <name><surname>Miller</surname><given-names>K. D.</given-names></name> <name><surname>Samimi</surname><given-names>G.</given-names></name> <name><surname>Runowicz</surname><given-names>C. D.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Ovarian cancer statistics, 2018</article-title>. <source>CA Cancer J. Clin.</source> <volume>68</volume>, <fpage>284</fpage>&#x2013;<lpage>296</lpage>. doi: <pub-id pub-id-type="doi">10.3322/caac.21456</pub-id>, PMID: <pub-id pub-id-type="pmid">29809280</pub-id></citation></ref>
<ref id="ref73"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>H.</given-names></name> <name><surname>Liu</surname><given-names>C.</given-names></name> <name><surname>Zhao</surname><given-names>Z.</given-names></name> <name><surname>Zhang</surname><given-names>C.</given-names></name> <name><surname>Wang</surname><given-names>X.</given-names></name> <name><surname>Li</surname><given-names>H.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Application of deep convolutional neural networks for discriminating benign, borderline, and malignant serous ovarian tumors from ultrasound images</article-title>. <source>Front. Oncol.</source> <volume>11</volume>:<fpage>770683</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fonc.2021.770683</pub-id>, PMID: <pub-id pub-id-type="pmid">34988015</pub-id></citation></ref>
<ref id="ref74"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>Z.</given-names></name> <name><surname>Luo</surname><given-names>S.</given-names></name> <name><surname>Chen</surname><given-names>J.</given-names></name> <name><surname>Jiao</surname><given-names>Y.</given-names></name> <name><surname>Cui</surname><given-names>C.</given-names></name> <name><surname>Shi</surname><given-names>S.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Multi-modality deep learning model reaches high prediction accuracy in the diagnosis of ovarian cancer</article-title>. <source>iScience</source> <volume>27</volume>:<fpage>109403</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.isci.2024.109403</pub-id>, PMID: <pub-id pub-id-type="pmid">38523785</pub-id></citation></ref>
<ref id="ref75"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wolff</surname><given-names>R. F.</given-names></name> <name><surname>Moons</surname><given-names>K. G. M.</given-names></name> <name><surname>Riley</surname><given-names>R. D.</given-names></name> <name><surname>Whiting</surname><given-names>P. F.</given-names></name> <name><surname>Westwood</surname><given-names>M.</given-names></name> <name><surname>Collins</surname><given-names>G. S.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>PROBAST: a tool to assess the risk of Bias and applicability of prediction model studies</article-title>. <source>Ann. Intern. Med.</source> <volume>170</volume>, <fpage>51</fpage>&#x2013;<lpage>58</lpage>. doi: <pub-id pub-id-type="doi">10.7326/M18-1376</pub-id>, PMID: <pub-id pub-id-type="pmid">30596875</pub-id></citation></ref>
<ref id="ref76"><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Wu</surname><given-names>C.</given-names></name> <name><surname>Wang</surname><given-names>Y.</given-names></name> <name><surname>Wang</surname><given-names>F.</given-names></name></person-group> <article-title>Deep learning for ovarian tumor classification with ultrasound images</article-title>. <conf-name>Pacific RIM Conference on Multimedia</conf-name> (<year>2018</year>). p. <fpage>395</fpage>&#x2013;<lpage>406</lpage>.</citation></ref>
<ref id="ref77"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xi</surname><given-names>M.</given-names></name> <name><surname>Zheng</surname><given-names>R.</given-names></name> <name><surname>Wang</surname><given-names>M.</given-names></name> <name><surname>Shi</surname><given-names>X.</given-names></name> <name><surname>Chen</surname><given-names>C.</given-names></name> <name><surname>Qian</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Ultrasonographic diagnosis of ovarian tumors through the deep convolutional neural network</article-title>. <source>Ginekol. Pol.</source> <volume>95</volume>, <fpage>181</fpage>&#x2013;<lpage>189</lpage>. doi: <pub-id pub-id-type="doi">10.5603/gpl.94956</pub-id>, PMID: <pub-id pub-id-type="pmid">37842987</pub-id></citation></ref>
<ref id="ref78"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xiang</surname><given-names>H.</given-names></name> <name><surname>Xiao</surname><given-names>Y.</given-names></name> <name><surname>Li</surname><given-names>F.</given-names></name> <name><surname>Li</surname><given-names>C.</given-names></name> <name><surname>Liu</surname><given-names>L.</given-names></name> <name><surname>Deng</surname><given-names>T.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Development and validation of an interpretable model integrating multimodal information for improving ovarian cancer diagnosis</article-title>. <source>Nat. Commun.</source> <volume>15</volume>:<fpage>2681</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-024-46700-2</pub-id>, PMID: <pub-id pub-id-type="pmid">38538600</pub-id></citation></ref>
<ref id="ref79"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xie</surname><given-names>W.</given-names></name> <name><surname>Lin</surname><given-names>W.</given-names></name> <name><surname>Li</surname><given-names>P.</given-names></name> <name><surname>Lai</surname><given-names>H.</given-names></name> <name><surname>Wang</surname><given-names>Z.</given-names></name> <name><surname>Liu</surname><given-names>P.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Developing a deep learning model for predicting ovarian cancer in ovarian-adnexal reporting and data system ultrasound (O-RADS US) category 4 lesions: a multicenter study</article-title>. <source>J. Cancer Res. Clin. Oncol.</source> <volume>150</volume>:<fpage>346</fpage>. doi: <pub-id pub-id-type="doi">10.1007/s00432-024-05872-6</pub-id>, PMID: <pub-id pub-id-type="pmid">38981916</pub-id></citation></ref>
<ref id="ref80"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuyeon</surname><given-names>J.</given-names></name> <name><surname>Taewan</surname><given-names>K.</given-names></name> <name><surname>Mi-Ryung</surname><given-names>H.</given-names></name> <name><surname>Sejin</surname><given-names>K.</given-names></name> <name><surname>Geunyoung</surname><given-names>K.</given-names></name> <name><surname>Seungchul</surname><given-names>L.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Ovarian tumor diagnosis using deep convolutional neural networks and a denoising convolutional autoencoder</article-title>. <source>Sci. Rep.</source> <volume>12</volume>:<fpage>17024</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-022-20653-2</pub-id></citation></ref>
</ref-list>
</back>
</article>