<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Cell Dev. Biol.</journal-id>
<journal-title>Frontiers in Cell and Developmental Biology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Cell Dev. Biol.</abbrev-journal-title>
<issn pub-type="epub">2296-634X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1532228</article-id>
<article-id pub-id-type="doi">10.3389/fcell.2024.1532228</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Cell and Developmental Biology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A multi-modal multi-branch framework for retinal vessel segmentation using ultra-widefield fundus photographs</article-title>
<alt-title alt-title-type="left-running-head">Xie et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fcell.2024.1532228">10.3389/fcell.2024.1532228</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Xie</surname>
<given-names>Qihang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2900816/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Li</surname>
<given-names>Xuefei</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Yuanyuan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lu</surname>
<given-names>Jiayi</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ma</surname>
<given-names>Shaodong</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zhao</surname>
<given-names>Yitian</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1362172/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zhang</surname>
<given-names>Jiong</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/933502/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Cixi Biomedical Research Institute</institution>, <institution>Wenzhou Medical University</institution>, <addr-line>Ningbo</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Laboratory of Advanced Theranostic Materials and Technology</institution>, <institution>Ningbo Institute of Materials Technology and Engineering</institution>, <institution>Chinese Academy of Sciences</institution>, <addr-line>Ningbo</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1439952/overview">Weihua Yang</ext-link>, Jinan University, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1664666/overview">Fei Shi</ext-link>, Soochow University, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2240043/overview">Lei Xie</ext-link>, Zhejiang University of Technology, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2562809/overview">Hongming Xu</ext-link>, Dalian University of Technology, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Jiong Zhang, <email>jiong.zhang@ieee.org</email>; Yitian Zhao, <email>yitian.zhao@nimte.ac.cn</email>
</corresp>
<fn fn-type="equal" id="fn001">
<label>
<sup>&#x2020;</sup>
</label>
<p>These authors have contributed equally to this work and share first authorship</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>08</day>
<month>01</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>12</volume>
<elocation-id>1532228</elocation-id>
<history>
<date date-type="received">
<day>21</day>
<month>11</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>12</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Xie, Li, Li, Lu, Ma, Zhao and Zhang.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Xie, Li, Li, Lu, Ma, Zhao and Zhang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Vessel segmentation in fundus photography has become a cornerstone technique for disease analysis. Within this field, Ultra-WideField (UWF) fundus images offer distinct advantages, including an expansive imaging range, detailed lesion data, and minimal adverse effects. However, the high resolution and low contrast inherent to UWF fundus images present significant challenges for accurate segmentation using deep learning methods, thereby complicating disease analysis in this context.</p>
</sec>
<sec>
<title>Methods</title>
<p>To address these issues, this study introduces M3B-Net, a novel multi-modal, multi-branch framework that leverages fundus fluorescence angiography (FFA) images to improve retinal vessel segmentation in UWF fundus images. Specifically, M3B-Net tackles the low segmentation accuracy caused by the inherently low contrast of UWF fundus images. Additionally, we propose an enhanced UWF-based segmentation network in M3B-Net, specifically designed to improve the segmentation of fine retinal vessels. The segmentation network includes the Selective Fusion Module (SFM), which enhances feature extraction within the segmentation network by integrating features generated during the FFA imaging process. To further address the challenges of high-resolution UWF fundus images, we introduce a Local Perception Fusion Module (LPFM) to mitigate context loss during the segmentation cut-patch process. Complementing this, the Attention-Guided Upsampling Module (AUM) enhances segmentation performance through convolution operations guided by attention mechanisms.</p>
</sec>
<sec>
<title>Results</title>
<p>Extensive experimental evaluations demonstrate that our approach significantly outperforms existing state-of-the-art methods for UWF fundus image segmentation.</p>
</sec>
</abstract>
<kwd-group>
<kwd>ultra-widefield</kwd>
<kwd>fundus fluorescence angiography</kwd>
<kwd>retinal vessel segmentation</kwd>
<kwd>multimodal framework</kwd>
<kwd>selective fusion</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Molecular and Cellular Pathology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Clinical studies have demonstrated that alterations in the morphology of fundus blood vessels are closely associated with the progression of ocular diseases. By analyzing these vascular changes, physicians can diagnose and evaluate the severity and nature of various eye conditions. Ultra-WideField (UWF) imaging, an advanced form of fundus imaging, has emerged as a critical tool for disease analysis. With its expansive 200-degree field of view, UWF imaging provides a significantly broader depiction of vascular and disease-related features compared to conventional color fundus imaging, which is typically limited to a 45-degree range. Fundus fluorescein angiography (FFA) images are regarded as the gold standard for clinical vascular detection due to their superior contrast and precise diagnostic information. However, FFA imaging is invasive and carries potential side effects, limiting its broader applicability. In contrast, UWF imaging is a non-invasive modality that offers high-resolution visualization of fundus structures across a panoramic field of view exceeding 200&#xb0;. This technology enables detailed detection and analysis of peripheral retinal vessels and focal areas of pathology, such as those seen in diabetic retinopathy and venous obstruction. UWF fundus imaging excels in capturing intricate views of peripheral retinal vessels and lesions, providing rich pathological information that significantly enhances clinical analysis (<xref ref-type="bibr" rid="B23">Nguyen et al., 2024</xref>; <xref ref-type="bibr" rid="B19">Liu et al., 2023</xref>; <xref ref-type="bibr" rid="B2">Chen et al., 2023</xref>; <xref ref-type="bibr" rid="B46">Zhang et al., 2021</xref>). In computational fundus image analysis, vascular segmentation stands out as a foundational and extensively studied task. Accurate delineation of fundus vascular structures is essential, serving as a prerequisite for effective disease diagnosis and assessment (<xref ref-type="bibr" rid="B43">Yang et al., 2023</xref>).</p>
<p>Over the past decade, significant progress has been made in fundus vessel segmentation, driven by advancements in filtering (<xref ref-type="bibr" rid="B45">Zhang et al., 2016</xref>; <xref ref-type="bibr" rid="B32">Soares et al., 2006</xref>; <xref ref-type="bibr" rid="B21">Memari et al., 2017</xref>), morphological (<xref ref-type="bibr" rid="B8">Fraz et al., 2013</xref>; <xref ref-type="bibr" rid="B14">Imani et al., 2015</xref>; <xref ref-type="bibr" rid="B17">Kumar and Ravichandran, 2017</xref>), statistical (<xref ref-type="bibr" rid="B26">Orlando et al., 2016</xref>; <xref ref-type="bibr" rid="B44">Yin et al., 2012</xref>; <xref ref-type="bibr" rid="B24">Oliveira et al., 2018</xref>), and deep learning algorithms (<xref ref-type="bibr" rid="B40">Wu et al., 2018</xref>; <xref ref-type="bibr" rid="B42">Yan et al., 2018</xref>; <xref ref-type="bibr" rid="B29">Ryu et al., 2023</xref>). Among these, deep learning techniques have demonstrated particularly remarkable potential in medical image processing. The Key contributions include the window-based and sliding window approaches for neural cell membrane segmentation in microscopy images proposed by <xref ref-type="bibr" rid="B4">Ciresan et al. (2012)</xref>, and the integration of multi-scale 3D Convolutional Neural Networks (CNNs) with Conditional Random Fields (CRFs) for brain lesion segmentation presented by <xref ref-type="bibr" rid="B16">Kamnitsas et al. (2017)</xref>. The introduction of end-to-end Fully Convolutional Networks (FCNs) (<xref ref-type="bibr" rid="B20">Long et al., 2015</xref>) marked a transformative milestone in biomedical image segmentation. Among these, U-Net, an iconic encoder-decoder architecture introduced by <xref ref-type="bibr" rid="B28">Ronneberger et al. (2015)</xref>, has gained widespread recognition for its ability to effectively integrate multi-resolution features. U-Net&#x2019;s superior performance in medical image segmentation has spurred the development of numerous refined iterations and enhanced versions (<xref ref-type="bibr" rid="B9">Fu et al., 2016</xref>; <xref ref-type="bibr" rid="B10">Gibson et al., 2018</xref>). To further improve segmentation performance, several multi-stage models have been proposed. For instance (<xref ref-type="bibr" rid="B42">Yan et al., 2018</xref>), developed a three-stage deep learning model for fundus blood vessel segmentation. Additionally, weakly supervised and semi-supervised approaches have been explored to address the challenge of sparsely labeled medical image data (<xref ref-type="bibr" rid="B27">Perone and Cohen-Adad, 2018</xref>). extended the Mean Teacher method for MRI segmentation, while (<xref ref-type="bibr" rid="B30">Seeb&#xf6;ck et al., 2019</xref>) proposed a Bayesian U-Net for abnormality detection in OCT image segmentation. Despite these advancements, challenges such as segmentation inaccuracies and limited adaptability persist. Moreover, relatively few studies have focused on Ultra-WideField imaging modalities, underscoring the need for further exploration in this domain.</p>
<p>Compared to color fundus images, limited research has focused on the extraction of integrated vascular structures in Ultra-WideField (UWF) fundus images. There has been research focused on the analysis and diagnosis of ophthalmic diseases based on UWF images (<xref ref-type="bibr" rid="B33">Tang et al., 2024</xref>; <xref ref-type="bibr" rid="B5">Deng et al., 2024</xref>; <xref ref-type="bibr" rid="B35">Wan et al., 2024</xref>) proposed a new segmentation algorithm for peripapillary atrophy and optic disk from UWF Photographs (<xref ref-type="bibr" rid="B7">Ding et al., 2020</xref>). introduced a deep-learning framework for efficient vascular detection in UWF fundus photography (<xref ref-type="bibr" rid="B25">Ong et al., 2023</xref>). employed U-Net (<xref ref-type="bibr" rid="B28">Ronneberger et al., 2015</xref>) to segment UWF fundus images for recognizing lesions associated with retinal vein occlusion. Recently (<xref ref-type="bibr" rid="B37">Wang et al., 2024</xref>), developed a pioneering framework utilizing a patch-based active domain adaptation approach to enhance vessel segmentation in UWF-SLO images by selectively identifying valuable image patches. Additionally, they constructed and annotated the first multi-center UWF-SLO vessel segmentation dataset, incorporating data from multiple institutions to advance research in this area. Similarly (<xref ref-type="bibr" rid="B39">Wu et al., 2024</xref>), released the first publicly available UWF retinal hemorrhage segmentation dataset and proposed a subtraction network specifically for UWF retinal hemorrhage segmentation (<xref ref-type="bibr" rid="B15">Ju et al., 2021</xref>). explored a modified Cycle Generative Adversarial Network (CycleGAN) (<xref ref-type="bibr" rid="B47">Zhu et al., 2017</xref>) to bridge the domain gap between standard and UWF fundus images, facilitating the training of UWF fundus diagnosis models. Despite these advancements, feature extraction for UWF fundus images remains underdeveloped, and the accuracy of blood vessel segmentation in UWF fundus images requires further improvement.</p>
<p>The study of blood vessel segmentation in UWF fundus images presents several complex challenges. Firstly, one of the primary challenges is the complex backgrounds and uneven illumination characteristic of UWF fundus images, which result in low contrast between blood vessels and surrounding tissue, making feature extraction more difficult. In contrast, Fundus Fluorescence Angiography (FFA) images offer substantially higher contrast for blood vessels, enabling more precise extraction of vascular features. This distinction highlights the potential of using FFA images as high-quality references to improve the accuracy of vascular feature extraction in UWF fundus images. In this context, style transfer&#x2014;an unsupervised image generation technique&#x2014;has emerged as a powerful tool for image style conversion and enhancement. Owing to its flexibility and effectiveness, style transfer algorithms are increasingly employed across a range of multimodal medical imaging tasks.</p>
<p>For example (<xref ref-type="bibr" rid="B34">Tavakkoli et al., 2020</xref>), introduced a deep learning conditional GAN capable of generating FFA images from fundus photographs. Their proposed GAN produced anatomically accurate angiograms with fidelity comparable to FFA images, significantly outperforming two state-of-the-art generative algorithms. Similarly (<xref ref-type="bibr" rid="B15">Ju et al., 2021</xref>), employed an enhanced CycleGAN (<xref ref-type="bibr" rid="B47">Zhu et al., 2017</xref>) to facilitate modal shifts between standard fundus images and UWF fundus images, effectively generating additional UWF fundus images for training purposes. This approach addressed challenges related to data scarcity and annotation. Inspired by these advancements in leveraging style transfer for downstream tasks, our research explores cross-modality-assisted feature extraction in UWF fundus images using style transfer models. Specifically, this thesis proposes a style transfer model to optimize the extraction of critical blood vessel features during the conversion from UWF to FFA images. This methodology aims to enhance the accuracy of retinal vessel segmentation in UWF fundus images.</p>
<p>Feature selection involves eliminating redundant or irrelevant features from a set of extracted features to improve performance. Recent advancements in image super-resolution have showcased the enhancement of low-resolution (LR) images by aligning LR and reference images in the feature space and fusing them using deep architectures. For instance (<xref ref-type="bibr" rid="B36">Wan et al., 2022</xref>), proposed a novel ternary translation network that transforms aged and pristine photos into a shared latent space. Pairwise learning is employed to translate between these latent spaces, generating quality-enhanced photos. Furthermore, several studies have utilized semantic consistency across diverse images as a form of bootstrapping during training, achieved by computing feature similarity (<xref ref-type="bibr" rid="B38">Wu et al., 2023</xref>). Inspired by these advancements, we explore search matching within the feature space for feature selection in a multi-stream framework. By identifying key features in UWF fundus images within the segmentation network, our approach achieves more precise segmentation of low-contrast retinal vessels.</p>
<p>Secondly, in addition to the challenge of low contrast, the high-resolution nature of UWF imaging poses a significant limitation to segmentation accuracy. Computational constraints have led many recent studies to adopt a patch-based approach for segmenting images (<xref ref-type="bibr" rid="B37">Wang et al., 2024</xref>). However, this method often disregards the interaction between local patches and the global context, resulting in segmentation inaccuracies, particularly in delineating edge details. To address this limitation, recent research has advocated for combining global and local features through multi-stream networks to enhance contextual awareness. These approaches have successfully mitigated the loss of contextual information inherent in patch-based segmentation methods. Building on these advancements, we propose incorporating a local-aware context module into the retinal vessel segmentation network for UWF images. This module aims to overcome the issue of blood vessel fragmentation by effectively integrating global and local information, thereby improving segmentation accuracy for high-resolution UWF fundus images.</p>
<p>Our contributions are summarized as follows:<list list-type="simple">
<list-item>
<p>
<inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> We propose a multi-modal, multi-branch framework, named M3B-Net, which is based on a style transfer strategy. This framework leverages the conversion of UWF fundus images to FFA images to enhance segmentation tasks for UWF fundus images. M3B-Net comprises two primary components: a style transfer network and a segmentation network.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> we incorporate a Selective Fusion Module (SFM) into the segmentation network to address the challenges of low contrast in UWF image segmentation. The SFM performs feature space matching to extract key features in the latent space, mitigating issues such as blood vessel fragmentation.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> We introduce a multi-scale local perception fusion module (LPFM) into the segmentation network according to the high-resolution nature of UWF fundus images. This module enhances the network&#x2019;s ability to discern contextual information effectively.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> We propose a multi-level attention upsampling module (AUM) to improve the segmentation of fine blood vessels. This module aims to mitigate feature loss during the upsampling process, enabling more precise segmentation of delicate vascular sr &#x3d; tryctures in UWF fundus images.</p>
</list-item>
</list>
</p>
</sec>
<sec sec-type="methods" id="s2">
<title>2 Methods</title>
<sec id="s2-1">
<title>2.1 Dataset</title>
<p>In this work, we validate the efficacy of our method using two datasets: a proprietary dataset and the publicly available PRIME-FP20 dataset (<xref ref-type="bibr" rid="B7">Ding et al., 2020</xref>).<list list-type="simple">
<list-item>
<p>
<inline-formula id="inf5">
<mml:math id="m5">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> The private dataset used in this study was collected at Ningbo Yinzhou People&#x2019;s Hospital. The fundus UWF image dataset was captured using an Ultra-WideField Laser Scanning Ophthalmoscope of Optos 200Tx with a resolution of <inline-formula id="inf6">
<mml:math id="m6">
<mml:mrow>
<mml:mn>3900</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>3072</mml:mn>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> The paired FFA images were obtained by a Heidelberg Spectralis HRA Instrument of the same unit, with a resolution of <inline-formula id="inf7">
<mml:math id="m7">
<mml:mrow>
<mml:mn>768</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>868</mml:mn>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> Based on this data, we constructed a UWF-FFA dataset (UWF-GAN) and a dataset for segmentation (UWF-SEG). The UWF-GAN dataset consists of 120 aligned UWF image patches and FFA image patches, which are intercepted and aligned from the paired whole UWF fundus images and FFA images. The UWF-SEG dataset comprises 65 UWF fundus images, each annotated with pixel-level vessel labels for evaluating segmentation performance. The vessel labels of the UWF fundus images were annotated by an experienced ophthalmologist using the Pair annotation tool. All images were collected with explicit patient consent, and we rigorously adhered to data security regulations by meticulously anonymizing all personal information to ensure patient privacy adequately. <xref ref-type="fig" rid="F1">Figure 1</xref> illustrates examples of the original UWF fundus images, the preprocessed UWF images, and the corresponding paired FFA image. We utilize histogram equalization to preprocess UWF fundus images, effectively highlighting the vascular structures. Both our method and the comparison methods use the preprocessed images as input.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf8">
<mml:math id="m8">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> The PRIME-FP20 dataset was designed to support the development and evaluation of retinal vessel segmentation algorithms for UWF fundus images. It contains 15 high-resolution UWF fundus images acquired using the Optos 200Tx camera (Optos plc, Dunfermline, United Kingdom). Each image is paired with a labeled binarized vascular map and a binarized mask that delineates the effective data area within the image. Additionally, a corresponding FFA image was simultaneously captured for each UWF fundus image. All images in the dataset feature a resolution of <inline-formula id="inf9">
<mml:math id="m9">
<mml:mrow>
<mml:mn>4000</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>4000</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> pixels.</p>
</list-item>
</list>
</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>
<bold>(A)</bold> Original UWF image. <bold>(B)</bold> Preprocessed UWF image. <bold>(C)</bold> FFA image paired with the UWF image.</p>
</caption>
<graphic xlink:href="fcell-12-1532228-g001.tif"/>
</fig>
</sec>
<sec id="s2-2">
<title>2.2 Framework overview</title>
<p>The proposed framework is illustrated in <xref ref-type="fig" rid="F2">Figure 2</xref>, comprising two main components: a segmentation network for UWF fundus images and a style transfer network that generates FFA images from UWF fundus images. The segmentation network includes an encoder with a Local Perception Fusion Module (LPFM), a Selective Fusion Module (SFM), a decoder equipped with a Multi-level Attention Upsampling Module (AUM), and an auxiliary tiny encoder-decoder structure. Meanwhile, the style transfer network utilizes a CycleGAN-based architecture (<xref ref-type="bibr" rid="B47">Zhu et al., 2017</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>The proposed framework M3B-Net for blood vessel segmentation in UWF fundus images.</p>
</caption>
<graphic xlink:href="fcell-12-1532228-g002.tif"/>
</fig>
<p>Our method consists of four stages. Stage 1: Use small patches to pre-train a transfer network to obtain FFA features. Stage 2: Use middle patches to pre-train an encoder, aiming to reduce computational overhead during segmentation network training. Stage 3: Similarly, large patches are used to pre-train a large-scale encoder. Stage 4: Freeze the network parameters from the first three stages and begin training the entire segmentation network. In the fourth stage, UWF fundus images <inline-formula id="inf10">
<mml:math id="m10">
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> from the dataset are simultaneously fed into both the segmentation network and the style transfer network initially. In the segmentation network, the LPFM processes the UWF images, extracting a feature map <inline-formula id="inf11">
<mml:math id="m11">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. This feature map is passed through the decoder with the multi-level AUM and subsequently processed by a compact U-shaped network to produce the final blood vessel segmentation results. Concurrently, in the CycleGAN-based style transfer network, the UWF images undergo encoding and decoding, resulting in another feature map <inline-formula id="inf12">
<mml:math id="m12">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. During the training phase, <inline-formula id="inf13">
<mml:math id="m13">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf14">
<mml:math id="m14">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are subjected to a search and matching process via the SFM, which aligns the feature maps from both networks. This alignment establishes a correspondence between the UWF and FFA images. Supervision for both networks is provided through a loss function based on paired UWF and FFA image biplets. The SFM filters the most relevant <inline-formula id="inf15">
<mml:math id="m15">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, which is subsequently fed into the downstream segmentation framework. The following sections provide detailed descriptions of the vessel segmentation network, the Selective Fusion Module, and the Multi-level Attention Upsampling Module.</p>
</sec>
<sec id="s2-3">
<title>2.3 Vessel segmentation network</title>
<p>The large size of UWF fundus images presents a challenge in balancing segmentation accuracy and computational efficiency for blood vessel segmentation networks. Traditional methods, such as down-sampling, patch cropping, and cascade modeling, struggle to achieve this balance effectively. In this paper, we propose an innovative cropping strategy to address this issue. We utilize an efficient approach by randomly extracting smaller patches from the original UWF image (size <inline-formula id="inf16">
<mml:math id="m16">
<mml:mrow>
<mml:mn>3900</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>3072</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>), resulting in patches of size <inline-formula id="inf17">
<mml:math id="m17">
<mml:mrow>
<mml:mn>256</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>256</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, referred to as &#x2018;small patches&#x2019;. From these small patches, we generate medium and large patches with dimensions of <inline-formula id="inf18">
<mml:math id="m18">
<mml:mrow>
<mml:mn>512</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>512</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf19">
<mml:math id="m19">
<mml:mrow>
<mml:mn>768</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>768</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, respectively. Centered on the small patch, we expand it by a factor of two to obtain a middle patch of <inline-formula id="inf20">
<mml:math id="m20">
<mml:mrow>
<mml:mn>512</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>512</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, and similarly, expand it by a factor of three to obtain a large patch of <inline-formula id="inf21">
<mml:math id="m21">
<mml:mrow>
<mml:mn>768</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>768</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. All three patch sizes are then resized to a uniform size of <inline-formula id="inf22">
<mml:math id="m22">
<mml:mrow>
<mml:mn>256</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>256</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and simultaneously input into three ResNet (<xref ref-type="bibr" rid="B13">He et al., 2016</xref>) feature extractors. The feature extractors for the medium and large patches are pre-trained, and their parameters are fixed during the segmentation process. This results in three distinct sets of feature maps corresponding to different scales.</p>
<p>After that, we apply the Local Perception Fusion Module (LPFM) to enhance the contextual positional features of the small patches across different scales. The process of the LPFM is illustrated in <xref ref-type="fig" rid="F3">Figure 3</xref>. First, we compute the inner products between the small patch and both the medium and large patches, obtaining attention maps through softmax activation. These attention maps are then used to generate new feature maps by performing inner product operations with the small patches. The resulting feature maps are regularized, and their weights are reassigned before being fused to form the final feature vector. Finally, these fused results are passed through the Selective Fusion Module (SFM), followed by the decoder and a small U-Net, to generate the final vessel binary mask.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>The details of the local perception fusion module framework.</p>
</caption>
<graphic xlink:href="fcell-12-1532228-g003.tif"/>
</fig>
<p>In the subsequent sections, we introduce the specifics of the selective fusion module and the multi-level attention upsampling module, which constitute components of the proposed segmentation network.</p>
</sec>
<sec id="s2-4">
<title>2.4 Selective fusion module</title>
<p>The details of the module are displayed in <xref ref-type="fig" rid="F2">Figure 2</xref>. As a crucial component for linking the two feature maps generated by the segmentation network and style transfer network, the SFM is based on knowledge related to feature engineering. Specifically, we propose to select FFA features to replace the broken blood vessel features ensuring that redundant information does not negatively impact segmentation performance. Initially, the network calculates the similarity between the feature map <inline-formula id="inf23">
<mml:math id="m23">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> output from the encoder of the segmentation network and the feature map <inline-formula id="inf24">
<mml:math id="m24">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> output from the encoder of the style transfer network. The similarity is computed using the Euclidean distance, as shown in <xref ref-type="disp-formula" rid="e1">Equation 1</xref> below:<disp-formula id="e1">
<mml:math id="m25">
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:munderover>
</mml:mstyle>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>
</p>
<p>Where <inline-formula id="inf25">
<mml:math id="m26">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf26">
<mml:math id="m27">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> denote the pixel values of the two feature maps, respectively, and <inline-formula id="inf27">
<mml:math id="m28">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> denotes the number of pixels of the feature maps. It is worth noticing that the images in this study are rich in information, and based on the limitation of computational resources and time cost, this study carries out partial sampling computation on the feature maps for local similarity comparison. We set a threshold and range of 0.5 to confirm the strength of similarity. Eventually, SFM will fuse the feature map <inline-formula id="inf28">
<mml:math id="m29">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> with high similarity to the feature map <inline-formula id="inf29">
<mml:math id="m30">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> to generate the fusion feature <inline-formula id="inf30">
<mml:math id="m31">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>. If the similarity between the two feature maps is low, it indicates that <inline-formula id="inf31">
<mml:math id="m32">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> does not provide more valuable information for vessel segmentation, and only <inline-formula id="inf32">
<mml:math id="m33">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is passed to the subsequent network layers.</p>
<p>Following the selection and fusion operations, multi-modal information is introduced in this study, which provides higher recognisability for retinal blood vessel segmentation. Additionally, similarity calculation and screening also avoid the interference of irrelevant features on the network when generating FFA images.</p>
</sec>
<sec id="s2-5">
<title>2.5 Multi-level attention upsampling module</title>
<p>As shown in <xref ref-type="fig" rid="F4">Figure 4</xref>, this module is designed to address the issue of vascular information loss during upsampling. The multi-level AUM primarily comprises two compact double convolutional blocks, denoted as <inline-formula id="inf33">
<mml:math id="m34">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf34">
<mml:math id="m35">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, which utilize an attention mechanism to capture feature representations at different levels. First, the feature map <inline-formula id="inf35">
<mml:math id="m36">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> generated by the SFM is input into <inline-formula id="inf36">
<mml:math id="m37">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, the detailed architecture of which is depicted in <xref ref-type="fig" rid="F4">Figure 4</xref>. <inline-formula id="inf37">
<mml:math id="m38">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> comprises two convolutional paths of different scales: path <inline-formula id="inf38">
<mml:math id="m39">
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> serves as the primary path and encompasses two <inline-formula id="inf39">
<mml:math id="m40">
<mml:mrow>
<mml:mn>7</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>7</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> convolutional layers, while path <inline-formula id="inf40">
<mml:math id="m41">
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> consists of a single <inline-formula id="inf41">
<mml:math id="m42">
<mml:mrow>
<mml:mn>7</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>7</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> convolutional layer. After the feature map <inline-formula id="inf42">
<mml:math id="m43">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> passes through path <inline-formula id="inf43">
<mml:math id="m44">
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and path <inline-formula id="inf44">
<mml:math id="m45">
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, two feature maps <inline-formula id="inf45">
<mml:math id="m46">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf46">
<mml:math id="m47">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are obtained. We calculate the attention weight <inline-formula id="inf47">
<mml:math id="m48">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> of <inline-formula id="inf48">
<mml:math id="m49">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> with respect to <inline-formula id="inf49">
<mml:math id="m50">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> by employing <inline-formula id="inf50">
<mml:math id="m51">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> as the query<inline-formula id="inf51">
<mml:math id="m52">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>Q</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, key<inline-formula id="inf52">
<mml:math id="m53">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf53">
<mml:math id="m54">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> as value <inline-formula id="inf54">
<mml:math id="m55">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>V</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. Subsequently, we perform element-wise multiplication between <inline-formula id="inf55">
<mml:math id="m56">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and the weight <inline-formula id="inf56">
<mml:math id="m57">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, and fuse the product with <inline-formula id="inf57">
<mml:math id="m58">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>a</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> to acquire the upsampling result, integrating feature information across diverse scales. This result is then forwarded to <inline-formula id="inf58">
<mml:math id="m59">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, the structure of which is illustrated in <xref ref-type="fig" rid="F4">Figure 4</xref>. <inline-formula id="inf59">
<mml:math id="m60">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> closely resembles the architecture of <inline-formula id="inf60">
<mml:math id="m61">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, with the key difference being the scale of convolution operations. Similar to <inline-formula id="inf61">
<mml:math id="m62">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf62">
<mml:math id="m63">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> comprises two convolutional paths <inline-formula id="inf63">
<mml:math id="m64">
<mml:mrow>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf64">
<mml:math id="m65">
<mml:mrow>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, with path <inline-formula id="inf65">
<mml:math id="m66">
<mml:mrow>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> serving as the primary path. After passing through both paths, we obtain two distinct feature maps, denoted as <inline-formula id="inf66">
<mml:math id="m67">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf67">
<mml:math id="m68">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. Subsequently, these feature maps undergo attention computation and fusion steps to yield the decoded result. The process is represented by <xref ref-type="disp-formula" rid="e2">Equations 2</xref>&#x2013;<xref ref-type="disp-formula" rid="e5">5</xref>:<disp-formula id="e2">
<mml:math id="m69">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext mathvariant="italic">Att</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>
<disp-formula id="e3">
<mml:math id="m70">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>u</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>
<disp-formula id="e4">
<mml:math id="m71">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext mathvariant="italic">Att</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>u</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>u</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>
<disp-formula id="e5">
<mml:math id="m72">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>u</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(5)</label>
</disp-formula>
</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>The details of the multi-level attention upsampling module.</p>
</caption>
<graphic xlink:href="fcell-12-1532228-g004.tif"/>
</fig>
<p>Where <inline-formula id="inf68">
<mml:math id="m73">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf69">
<mml:math id="m74">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>u</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf70">
<mml:math id="m75">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are the intermediate values computed by the module for the feature map. <inline-formula id="inf71">
<mml:math id="m76">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf72">
<mml:math id="m77">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represent attention weight, while <inline-formula id="inf73">
<mml:math id="m78">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>u</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> represents the output of <inline-formula id="inf74">
<mml:math id="m79">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. <inline-formula id="inf75">
<mml:math id="m80">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> refers to the final output of the module, and <inline-formula id="inf76">
<mml:math id="m81">
<mml:mrow>
<mml:mtext mathvariant="italic">Attn</mml:mtext>
</mml:mrow>
</mml:math>
</inline-formula> represents the attention mechanism. <inline-formula id="inf77">
<mml:math id="m82">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf78">
<mml:math id="m83">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf79">
<mml:math id="m84">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf80">
<mml:math id="m85">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf81">
<mml:math id="m86">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> correspond five different convolutional layers.</p>
<p>By employing multi-scale convolutions and integrating an attention mechanism, this study enhances retinal blood vessel segmentation with improved structural comprehensiveness. The module excels at fusing feature information across different scales, thereby reducing information loss and omissions during the upsampling process. As a result, it more effectively addresses the challenge of incomplete segmentation of fine retinal blood vessels in UWF fundus images.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Implementation details</title>
<p>In the experiment, UWF fundus images are preprocessed using the contrast adaptive histogram equalization method to enhance the contrast of the images. The UWF-SEG dataset contains a total of 65 images, with 20 images allocated to the test set and the remaining 45 images utilized for training purposes. The PRIME-FP20 dataset consists of 15 images, with 10 images used for training and the remaining 5 images for testing. To ensure consistency, all images are resized to dimensions of <inline-formula id="inf82">
<mml:math id="m87">
<mml:mrow>
<mml:mn>1024</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>1024</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> pixels, with small patches resized to <inline-formula id="inf83">
<mml:math id="m88">
<mml:mrow>
<mml:mn>256</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>256</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> pixels. Data augmentation techniques, including random flipping and rotation, are applied during the experiments. The training process spans 200 epochs, enabling the model to converge and effectively capture underlying patterns within the data.</p>
<p>In the experimentation of the proposed method, the model was implemented using PyTorch 3.8 and trained on a workstation equipped with four NVIDIA GeForce RTX 3090 GPUs. A batch size of 5 was used for the UWF-SEG dataset, and 2 for the PRIME-FP20 dataset throughout the training process. The initial learning rate for the vascular segmentation network was set to 0.0004, with a weight decay rate of 0.0005. The Adam optimizer was employed for gradient updates.</p>
</sec>
<sec id="s3-2">
<title>3.2 Evaluation metrics</title>
<p>To evaluate the performance of the proposed retinal vessel segmentation method, four widely adopted metrics are used in this work, namely,: the Dice Similarity Coefficient (Dice), Sensitivity (Sen), and Balanced Accuracy (BACC). In the evaluation of the method, the sigmoid function was used as the activation function for the final output, and the confusion matrix was calculated (comprising True Positives (TP), False Positives (FP), True Negatives (TN), and False Negatives (FN)) to evaluate the accuracy of the method. The relevant formulas and their significance are as follows:<list list-type="simple">
<list-item>
<p>
<inline-formula id="inf84">
<mml:math id="m89">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> Dice Similarity Coefficient (Dice) &#x3d; 2 <inline-formula id="inf85">
<mml:math id="m90">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> TP/(2 <inline-formula id="inf86">
<mml:math id="m91">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> TP &#x2b; FP &#x2b; FN).</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf87">
<mml:math id="m92">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> Sensitivity (SEN) &#x3d; TP/(TP &#x2b; FN).</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf88">
<mml:math id="m93">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> True Positive Rate (TPR) &#x3d; TP/(TP &#x2b; FN).</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf89">
<mml:math id="m94">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> True egative Rate (TNR) &#x3d; TN/(FP &#x2b; TN).</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf90">
<mml:math id="m95">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> Balanced Accuracy (BACC) &#x3d; (TPR &#x2b; TNR)/2.</p>
</list-item>
</list>
</p>
<p>Where True Positives (TP) represent the number of samples correctly classified as positive, False Positives (FP) refer to samples incorrectly classified as positive, True Negatives (TN) are the samples correctly classified as negative, and False Negatives (FN) are the samples incorrectly predicted as negative when they should have been positive.</p>
</sec>
<sec id="s3-3">
<title>3.3 Comparison with state-of-the-art methods</title>
<p>A comprehensive series of comparative experiments were conducted in this section to demonstrate the effectiveness of the proposed method. These experiments included both quantitative and qualitative analyses, evaluating the performance on both public and private test sets. Several state-of-the-art approaches in fundus vessel segmentation were selected for comparison in this study, including CE-Net (<xref ref-type="bibr" rid="B11">Gu et al., 2019</xref>), CS-Net (<xref ref-type="bibr" rid="B22">Mou et al., 2021</xref>), TransUnet (<xref ref-type="bibr" rid="B3">Chen et al., 2021</xref>), SwinUnet (<xref ref-type="bibr" rid="B1">Cao et al., 2022</xref>), U-Net (<xref ref-type="bibr" rid="B28">Ronneberger et al., 2015</xref>), ResUnet (<xref ref-type="bibr" rid="B41">Xiao et al., 2018</xref>) and ConvUNext (<xref ref-type="bibr" rid="B12">Han et al., 2022</xref>). All these methods have demonstrated superior performance in fundus image analysis. To ensure the fairness of the experiments, identical image preprocessing and cropping techniques were applied across all methods, and the datasets were divided into the same training test sets.</p>
</sec>
<sec id="s3-4">
<title>3.4 Performance of vessel segmentation on the private dataset UWF-SEG</title>
<p>The metrics analysis shows that the proposed method outperforms other methods in terms of the effectiveness of retinal blood vessel segmentation in UWF fundus images. Specifically, the M3B-Net method presented in this chapter surpasses other methods across all evaluated metrics (Dice, Sen, and BACC) as demonstrated in <xref ref-type="table" rid="T1">Table 1</xref>. For example, on the private UWF-SEG dataset, our method achieves improvements of approximately 5.19%, 3.35%, and 1.60% in Dice, Sensitivity, and BACC, respectively, compared to the ConvUNext model (<xref ref-type="bibr" rid="B12">Han et al., 2022</xref>). Additionally, our method provides more detailed vascular information, facilitating a finer observation of the retinal vessels. This improvement is primarily attributed to the proposed framework&#x2019;s focus on enhancing the vascular signal while minimizing the influence of background noise during the reconstruction process.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>The vessel segmentation results of different methods on UWF-SEG dataset and FRIME-FP20 datase<bold>t</bold>.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="1" align="left">Methods</th>
<th colspan="3" align="center">UWF-SEG</th>
<th colspan="3" align="center">FRIME-FP20</th>
</tr>
<tr>
<th align="left">&#xa0;</th>
<th align="center">
<italic>BACC(%)</italic> <inline-formula id="inf91">
<mml:math id="m96">
<mml:mrow>
<mml:mi>&#x2191;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">
<italic>Sen(%)</italic> <inline-formula id="inf92">
<mml:math id="m97">
<mml:mrow>
<mml:mi>&#x2191;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">
<italic>Dice(%)</italic> <inline-formula id="inf93">
<mml:math id="m98">
<mml:mrow>
<mml:mi>&#x2191;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">
<italic>BACC(%)</italic> <inline-formula id="inf94">
<mml:math id="m99">
<mml:mrow>
<mml:mi>&#x2191;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">
<italic>Sen(%)</italic> <inline-formula id="inf95">
<mml:math id="m100">
<mml:mrow>
<mml:mi>&#x2191;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">
<italic>Dice(%)</italic> <inline-formula id="inf96">
<mml:math id="m101">
<mml:mrow>
<mml:mi>&#x2191;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">U-Net (<xref ref-type="bibr" rid="B28">Ronneberger et al., 2015</xref>)</td>
<td align="center">85.34 <inline-formula id="inf97">
<mml:math id="m102">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.22</td>
<td align="center">71.88 <inline-formula id="inf98">
<mml:math id="m103">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.62</td>
<td align="center">73.14 <inline-formula id="inf99">
<mml:math id="m104">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.82</td>
<td align="center">78.90 <inline-formula id="inf100">
<mml:math id="m105">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 3.03</td>
<td align="center">57.88 <inline-formula id="inf101">
<mml:math id="m106">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 6.08</td>
<td align="center">70.92 <inline-formula id="inf102">
<mml:math id="m107">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 4.73</td>
</tr>
<tr>
<td align="left">ResUnet (<xref ref-type="bibr" rid="B6">Diakogiannis et al., 2020</xref>)</td>
<td align="center">86.54 <inline-formula id="inf103">
<mml:math id="m108">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.90</td>
<td align="center">74.52 <inline-formula id="inf104">
<mml:math id="m109">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.71</td>
<td align="center">75.67 <inline-formula id="inf105">
<mml:math id="m110">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.68</td>
<td align="center">86.74 <inline-formula id="inf106">
<mml:math id="m111">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.21</td>
<td align="center">73.72 <inline-formula id="inf107">
<mml:math id="m112">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.43</td>
<td align="center">79.24 <inline-formula id="inf108">
<mml:math id="m113">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.93</td>
</tr>
<tr>
<td align="left">CE-Net (<xref ref-type="bibr" rid="B11">Gu et al., 2019</xref>)</td>
<td align="center">87.71 <inline-formula id="inf109">
<mml:math id="m114">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.66</td>
<td align="center">77.55 <inline-formula id="inf110">
<mml:math id="m115">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 3.35</td>
<td align="center">72.64 <inline-formula id="inf111">
<mml:math id="m116">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.55</td>
<td align="center">88.07 <inline-formula id="inf112">
<mml:math id="m117">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.02</td>
<td align="center">76.44 <inline-formula id="inf113">
<mml:math id="m118">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.06</td>
<td align="center">79.88 <inline-formula id="inf114">
<mml:math id="m119">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.65</td>
</tr>
<tr>
<td align="left">CS-Net (<xref ref-type="bibr" rid="B22">Mou et al., 2021</xref>)</td>
<td align="center">79.69 <inline-formula id="inf115">
<mml:math id="m120">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 3.66</td>
<td align="center">60.18 <inline-formula id="inf116">
<mml:math id="m121">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 7.54</td>
<td align="center">68.50 <inline-formula id="inf117">
<mml:math id="m122">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 5.54</td>
<td align="center">81.06 <inline-formula id="inf118">
<mml:math id="m123">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.87</td>
<td align="center">62.24 <inline-formula id="inf119">
<mml:math id="m124">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 5.76</td>
<td align="center">73.61 <inline-formula id="inf120">
<mml:math id="m125">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 4.49</td>
</tr>
<tr>
<td align="left">TransUnet (<xref ref-type="bibr" rid="B3">Chen et al., 2021</xref>)</td>
<td align="center">83.95 <inline-formula id="inf121">
<mml:math id="m126">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.64</td>
<td align="center">68.82 <inline-formula id="inf122">
<mml:math id="m127">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 3.39</td>
<td align="center">74.75 <inline-formula id="inf123">
<mml:math id="m128">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.76</td>
<td align="center">88.12 <inline-formula id="inf124">
<mml:math id="m129">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.85</td>
<td align="center">76.54 <inline-formula id="inf125">
<mml:math id="m130">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.72</td>
<td align="center">79.70 <inline-formula id="inf126">
<mml:math id="m131">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.37</td>
</tr>
<tr>
<td align="left">SwinUnet (<xref ref-type="bibr" rid="B1">Cao et al., 2022</xref>)</td>
<td align="center">85.24 <inline-formula id="inf127">
<mml:math id="m132">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.47</td>
<td align="center">71.80 <inline-formula id="inf128">
<mml:math id="m133">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.98</td>
<td align="center">73.64 <inline-formula id="inf129">
<mml:math id="m134">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.94</td>
<td align="center">81.65 <inline-formula id="inf130">
<mml:math id="m135">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.64</td>
<td align="center">63.78 <inline-formula id="inf131">
<mml:math id="m136">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 3.39</td>
<td align="center">68.74 <inline-formula id="inf132">
<mml:math id="m137">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.72</td>
</tr>
<tr>
<td align="left">ConvUNext (<xref ref-type="bibr" rid="B12">Han et al., 2022</xref>)</td>
<td align="center">88.67 <inline-formula id="inf133">
<mml:math id="m138">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.27</td>
<td align="center">79.10 <inline-formula id="inf134">
<mml:math id="m139">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.55</td>
<td align="center">73.35 <inline-formula id="inf135">
<mml:math id="m140">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.36</td>
<td align="center">91.99 <inline-formula id="inf136">
<mml:math id="m141">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.31</td>
<td align="center">84.65 <inline-formula id="inf137">
<mml:math id="m142">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 3.34</td>
<td align="center">78.06 <inline-formula id="inf138">
<mml:math id="m143">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.44</td>
</tr>
<tr>
<td align="left">Previously Proposed (<xref ref-type="bibr" rid="B18">Li et al., 2023</xref>)</td>
<td align="center">89.30 <inline-formula id="inf139">
<mml:math id="m144">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.22</td>
<td align="center">79.96 <inline-formula id="inf140">
<mml:math id="m145">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.57</td>
<td align="center">78.13 <inline-formula id="inf141">
<mml:math id="m146">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.73</td>
<td align="center">92.09 <inline-formula id="inf142">
<mml:math id="m147">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.59</td>
<td align="center">84.93 <inline-formula id="inf143">
<mml:math id="m148">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.25</td>
<td align="center">81.97 <inline-formula id="inf144">
<mml:math id="m149">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.82</td>
</tr>
<tr>
<td align="left">Ours</td>
<td align="center">
<bold>90.27</bold> <inline-formula id="inf145">
<mml:math id="m150">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <bold>1.87</bold>
</td>
<td align="center">
<bold>82.45</bold> <inline-formula id="inf146">
<mml:math id="m151">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <bold>3.80</bold>
</td>
<td align="center">
<bold>78.54</bold> <inline-formula id="inf147">
<mml:math id="m152">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <bold>0.44</bold>
</td>
<td align="center">
<bold>93.15</bold> <inline-formula id="inf148">
<mml:math id="m153">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <bold>0.73</bold>
</td>
<td align="center">
<bold>87.17</bold> <inline-formula id="inf149">
<mml:math id="m154">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <bold>1.53</bold>
</td>
<td align="center">
<bold>83.02</bold> <inline-formula id="inf150">
<mml:math id="m155">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <bold>0.70</bold>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>This significant performance improvement can be attributed to the proposed method&#x2019;s enhanced capability in segmenting fine retinal blood vessels in UWF fundus images. Specifically, the proposed method utilizes cross-modal image style transfer to achieve effective feature enhancement. During the learning process, the selective fusion module enables the segmentation network to select two feature maps based on correlation calculations, which significantly improves the recognition of fine retinal vessels. This approach mitigates the risk of information loss that can occur when directly applying enhancement techniques. Furthermore, given the wide imaging range of UWF fundus images, the study incorporates a local perceptual fusion module and a multi-level attention upsampling module. These modules ensure that global information is effectively integrated during the encoding process while minimizing the loss of vascular details during the decoding stage.</p>
<p>As shown in <xref ref-type="fig" rid="F5">Figure 5</xref>, the original image from the private UWF-SEG dataset, along with the segmentation results from our method and other comparative approaches, are presented. From the figure, it is evident that TransUnet (<xref ref-type="bibr" rid="B3">Chen et al., 2021</xref>), a network structure based on the attention mechanism, is better at capturing both local and global feature relationships than traditional convolutional neural networks. However, the segmentation results exhibit obvious under-segmentation, which indicates that it is more seriously affected by the artifacts and lesion areas in the UWF images during the segmentation process. Additionally, other comparative methods show obvious vessel breaks and unrecognized small vessel ends in the segmentation results. In contrast, our method can more effectively identify the small vessels in UWF fundus images, reducing under-segmentation while also mitigating the over-segmentation issues, as highlighted in the orange boxes in <xref ref-type="fig" rid="F5">Figure 5</xref>.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Vessel segmentation results of UWF fundus images by different methods on UWF-SEG dataset, where the white, green, and red represent true positive, false negative, and false positive, respectively.</p>
</caption>
<graphic xlink:href="fcell-12-1532228-g005.tif"/>
</fig>
</sec>
<sec id="s3-5">
<title>3.5 Performance of vessel segmentation on the PRIME-FP20</title>
<p>Similar to the experimental evaluation metrics for the private dataset, this study also conducts both quantitative and qualitative analyses of all methods on the public PRIME-FP20 dataset. As shown in <xref ref-type="table" rid="T1">Table 1</xref>, a comparison of the experimental results from our method and other segmentation approaches on the public dataset demonstrates the superior performance of our method. Specifically, on the PRIME-FP20 dataset, our method shows a 3.14% improvement in the Dice score compared to CE-Net (<xref ref-type="bibr" rid="B11">Gu et al., 2019</xref>) and outperforms the ConvUNext (<xref ref-type="bibr" rid="B12">Han et al., 2022</xref>) by 2.52% in SEN and 1.16% in BACC. These results highlight the effectiveness of our method. Furthermore, our method performs better on the public dataset than on the private dataset, primarily due to the segmentation challenges introduced by lesion regions in the private dataset.</p>
<p>Additionally, we present both the over-segmentation and under-segmentation results of our proposed method and other comparative methods in <xref ref-type="fig" rid="F6">Figure 6</xref>. It is evident that our method is more effective in recognizing fine vessels and vessels in low-contrast regions. As shown in the orange boxes of <xref ref-type="fig" rid="F6">Figure 6</xref>, although all methods tend to under-segment fine blood vessels near vessel terminals, our method demonstrates superior vessel recognition compared to the others. Furthermore, methods such as SwinUnet (<xref ref-type="bibr" rid="B1">Cao et al., 2022</xref>), TransUnet <xref ref-type="bibr" rid="B3">Chen et al. (2021)</xref>, and CE-Net (<xref ref-type="bibr" rid="B11">Gu et al., 2019</xref>) exhibit more pronounced over-segmentation, primarily due to interference from artifacts and lesion areas. In contrast, our method mitigates the impact of these artifacts and noise, thereby reducing the over-segmentation problem.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Vessel segmentation results of different methods on PRIME-FP20 dataset, where the white, green, and red represent true positive, false negative, and false positive, respectively.</p>
</caption>
<graphic xlink:href="fcell-12-1532228-g006.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussion</title>
<sec id="s4-1">
<title>4.1 Ablation studies</title>
<p>To evaluate the performance of the proposed method for retinal vessel segmentation and to further assess the effectiveness of each individual component, this section establishes various baselines for comparison. Extensive experiments are conducted on the publicly available dataset PRIME-FP20, utilizing identical image preprocessing and cropping methods across all baseline methods. As shown in <xref ref-type="table" rid="T2">Table 2</xref>, LPFM, SFM, and AUM components represent the local perception fusion module, the selective fusion module, and the multi-level attention upsampling module, respectively. The symbol <inline-formula id="inf151">
<mml:math id="m156">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> denotes the inclusion of a component, while <inline-formula id="inf152">
<mml:math id="m157">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> indicates its exclusion. A comparative analysis of rows 3 to 6 demonstrates that the inclusion of each component significantly improves the results, highlighting their effectiveness. Specifically, incorporating the LPFM component alone improves our method&#x2019;s BACC, Sen, and Dice metrics by 1.11%, 2.21%, and 0.63%, respectively. Adding the SFM component alone outperforms the baseline method by 2.45%, 4.98%, and 2.09%, respectively. Including the AUM component alone surpasses the baseline method by 1.04%, 2.09%, and 0.96%, respectively. The SFM significantly enhances the segmentation performance of the method by introducing FFA features from the style transfer network. The LPFM enhances the network&#x2019;s multi-scale perception capability, while the AUM notably improves the results, particularly the sensitivity, indicating that it reduces feature loss during the upsampling process. Additionally, as depicted in rows 7 to 9 of <xref ref-type="table" rid="T2">Table 2</xref>, the combination of any two out of the three components also enhances performance. Specifically, adding the SFM yields a greater improvement than combining LPFM and AUM, suggesting that FFA features play a crucial role in enhancing retinal blood vessel segmentation in UWF fundus images. Finally, our method achieves better performance by integrating all these components.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>The vessel segmentation results of different baseline methods on PRIME-FP20 dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="3" align="center">Methods</th>
<th colspan="1" align="center">
<italic>BACC(%)</italic>
<inline-formula id="inf153">
<mml:math id="m158">
<mml:mrow>
<mml:mi>&#x2191;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th colspan="1" align="center">
<italic>Sen(%)</italic> <inline-formula id="inf154">
<mml:math id="m159">
<mml:mrow>
<mml:mi>&#x2191;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th colspan="1" align="center">
<italic>Dice(%)</italic> <inline-formula id="inf155">
<mml:math id="m160">
<mml:mrow>
<mml:mi>&#x2191;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
</tr>
<tr>
<th align="center">LPFM</th>
<th align="center">SFM</th>
<th align="center">AUM</th>
<th align="left"/>
<th align="left"/>
<th align="left"/>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">
<inline-formula id="inf156">
<mml:math id="m161">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf157">
<mml:math id="m162">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf158">
<mml:math id="m163">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">86.37 <inline-formula id="inf159">
<mml:math id="m164">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.46</td>
<td align="center">73.15 <inline-formula id="inf160">
<mml:math id="m165">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.97</td>
<td align="center">79.28 <inline-formula id="inf161">
<mml:math id="m166">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.08</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf162">
<mml:math id="m167">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf163">
<mml:math id="m168">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf164">
<mml:math id="m169">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">87.48 <inline-formula id="inf165">
<mml:math id="m170">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.26</td>
<td align="center">75.36 <inline-formula id="inf166">
<mml:math id="m171">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.56</td>
<td align="center">79.91 <inline-formula id="inf167">
<mml:math id="m172">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.90</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf168">
<mml:math id="m173">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf169">
<mml:math id="m174">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf170">
<mml:math id="m175">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">88.82 <inline-formula id="inf171">
<mml:math id="m176">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.38</td>
<td align="center">78.13 <inline-formula id="inf172">
<mml:math id="m177">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.83</td>
<td align="center">81.37 <inline-formula id="inf173">
<mml:math id="m178">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.64</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf174">
<mml:math id="m179">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf175">
<mml:math id="m180">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf176">
<mml:math id="m181">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">87.41 <inline-formula id="inf177">
<mml:math id="m182">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.01</td>
<td align="center">75.24 <inline-formula id="inf178">
<mml:math id="m183">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.06</td>
<td align="center">80.24 <inline-formula id="inf179">
<mml:math id="m184">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.05</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf180">
<mml:math id="m185">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf181">
<mml:math id="m186">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf182">
<mml:math id="m187">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">91.49 <inline-formula id="inf183">
<mml:math id="m188">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.04</td>
<td align="center">83.63 <inline-formula id="inf184">
<mml:math id="m189">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 2.14</td>
<td align="center">82.34 <inline-formula id="inf185">
<mml:math id="m190">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.73</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf186">
<mml:math id="m191">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf187">
<mml:math id="m192">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf188">
<mml:math id="m193">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">91.05 <inline-formula id="inf189">
<mml:math id="m194">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.82</td>
<td align="center">82.67 <inline-formula id="inf190">
<mml:math id="m195">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.67</td>
<td align="center">82.85 <inline-formula id="inf191">
<mml:math id="m196">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.55</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf192">
<mml:math id="m197">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf193">
<mml:math id="m198">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf194">
<mml:math id="m199">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">92.60 <inline-formula id="inf195">
<mml:math id="m200">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.75</td>
<td align="center">85.94 <inline-formula id="inf196">
<mml:math id="m201">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 1.53</td>
<td align="center">82.73 <inline-formula id="inf197">
<mml:math id="m202">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 0.70</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf198">
<mml:math id="m203">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf199">
<mml:math id="m204">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf200">
<mml:math id="m205">
<mml:mrow>
<mml:mi>&#x221a;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<bold>93.15</bold> <inline-formula id="inf201">
<mml:math id="m206">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <bold>0.73</bold>
</td>
<td align="center">
<bold>87.17</bold> <inline-formula id="inf202">
<mml:math id="m207">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <bold>1.53</bold>
</td>
<td align="center">
<bold>83.02</bold> <inline-formula id="inf203">
<mml:math id="m208">
<mml:mrow>
<mml:mo>&#xb1;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <bold>0.70</bold>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>To further demonstrate the effectiveness of our method and its components, LPFM, SFM, and AUM. We also conducted the GradCAM (<xref ref-type="bibr" rid="B31">Selvaraju et al., 2017</xref>) visualization of the output from the final layer of the network decoder, as shown in <xref ref-type="fig" rid="F7">Figure 7</xref>. As observed in <xref ref-type="fig" rid="F7">Figures 7B, C</xref>, and <xref ref-type="fig" rid="F7">Figure 7D</xref>, the orange boxes indicate stronger responses to small blood vessels compared to <xref ref-type="fig" rid="F7">Figure 7A</xref>, particularly in <xref ref-type="fig" rid="F7">Figure 7C</xref>. This demonstrates the effectiveness of the designed components and underscores the advantages of incorporating the FFA modality for low-contrast vessel segmentation. Ultimately, by combining all three components, our method achieves superior vessel segmentation performance.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>It is the GradCAM visualization of the output from the final layer of the network decoder. Specifically, <bold>(A)</bold> The result obtained without adding any components. <bold>(B)</bold> The result LPFM. <bold>(C)</bold> The result of SFM. <bold>(D)</bold> The result with AUM. <bold>(E)</bold> The result of SFM &#x2b; AUM. <bold>(F)</bold> The result of LPFM &#x2b; SFM &#x2b; AUM.</p>
</caption>
<graphic xlink:href="fcell-12-1532228-g007.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="conclusion" id="s5">
<title>5 Conclusion</title>
<p>We propose an FFA-assisted multi-branch segmentation framework, named M3B-Net, for retinal blood vessel segmentation in UWF fundus images. This framework addresses the challenges of low segmentation accuracy and image boundary artifacts, which are caused by low contrast and the wide imaging range of UWF fundus images. To overcome these issues, M3B-Net integrates a segmentation approach based on style transfer, incorporating a selective fusion module and a multi-level attention upsampling module within the network. Comparative experiments are conducted on two datasets to highlight the superiority of our method, while ablation studies on a public dataset validate the effectiveness of each component. The experimental results demonstrate that our method achieves optimal performance in vessel segmentation of UWF fundus images, successfully overcoming the difficulties associated with segmenting fine blood vessels in these images.</p>
<p>UWF image segmentation enables the precise identification of retinal structures and lesions, facilitating the early detection of diseases such as diabetic retinopathy, age-related macular degeneration, and retinal vein occlusion. Early detection can lead to timely interventions and better patient outcomes. Automated segmentation reduces the reliance on manual annotations, minimizing inter-observer variability and improving diagnostic consistency. This helps ophthalmologists make more accurate and reliable clinical decisions. Therefore, we believe that our method better serves clinical applications by improving retinal vessel segmentation accuracy in UWF fundus images through the integration of the FFA image modality. However, our method may not be very efficient in terms of computational resource consumption. In the future, we will focus on addressing this issue.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The datasets presented in this article are not readily available because It contains private data. Requests to access the datasets should be directed to <email>jiong.zhang@ieee.org</email>.</p>
</sec>
<sec sec-type="ethics-statement" id="s7">
<title>Ethics statement</title>
<p>Written informed consent was obtained from the individual(s) for the publication of any potentially identifiable images or data included in this article.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>QX: Visualization, Writing&#x2013;original draft, Writing&#x2013;review and editing, Validation. XL: Data curation, Writing&#x2013;original draft, Writing&#x2013;review and editing, Software. YL: Writing&#x2013;review and editing, Project administration. JL: Writing&#x2013;review and editing, Software. SM: Writing&#x2013;review and editing, Conceptualization. YZ: Writing&#x2013;review and editing, Formal Analysis. JZ: Supervision, Writing&#x2013;original draft, Writing&#x2013;review and editing, Conceptualization, Funding acquisition.</p>
</sec>
<sec sec-type="funding-information" id="s9">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This work was supported in part by the National Science Foundation Program of China (62103398, 62371442), in part by the Zhejiang Provincial Natural Science Foundation (LQ23F010002, LZ23F010002, LR24F010002), in part by Zhejiang Provincial Special Support Program for High-Level Talents (2021R52004).</p>
</sec>
<ack>
<p>We thank Ningbo Yinzhou People&#x2019;s Hospital for their invaluable assistance in collecting and annotating the private dataset used in this study.</p>
</ack>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s11">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s12">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Cao</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). &#x201c;<article-title>Swin-unet: unet-like pure transformer for medical image segmentation</article-title>,&#x201d; in <conf-name>European conference on computer vision</conf-name>, <conf-loc>USA</conf-loc>, <conf-date>Oct 4th, 2024</conf-date> (<publisher-name>Springer</publisher-name>), <fpage>205</fpage>&#x2013;<lpage>218</lpage>.</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Dual-path and multi-scale enhanced attention network for retinal diseases classification using ultra-wide-field images</article-title>. <source>IEEE Access</source> <volume>11</volume>, <fpage>45405</fpage>&#x2013;<lpage>45415</lpage>. <pub-id pub-id-type="doi">10.1109/access.2023.3273613</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Adeli</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Transunet: transformers make strong encoders for medical image segmentation</article-title>. <comment>
<italic>arXiv preprint arXiv:2102.04306</italic>
</comment>.</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ciresan</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Giusti</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gambardella</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Schmidhuber</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Deep neural networks segment neuronal membranes in electron microscopy images</article-title>. <source>Adv. neural Inf. Process. Syst.</source> <volume>25</volume>.</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Deng</surname>
<given-names>X.-Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.-X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.-X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.-Q.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Retinal vascular morphological characteristics in diabetic retinopathy: an artificial intelligence study using a transfer learning system to analyze ultra-wide field images</article-title>. <source>Int. J. Ophthalmol.</source> <volume>17</volume>, <fpage>1001</fpage>&#x2013;<lpage>1006</lpage>. <pub-id pub-id-type="doi">10.18240/ijo.2024.06.03</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Diakogiannis</surname>
<given-names>F. I.</given-names>
</name>
<name>
<surname>Waldner</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Caccetta</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Resunet-a: a deep learning framework for semantic segmentation of remotely sensed data</article-title>. <source>ISPRS J. Photogrammetry Remote Sens.</source> <volume>162</volume>, <fpage>94</fpage>&#x2013;<lpage>114</lpage>. <pub-id pub-id-type="doi">10.1016/j.isprsjprs.2020.01.013</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ding</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Kuriyan</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Ramchandran</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Wykoff</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Sharma</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Weakly-supervised vessel detection in ultra-widefield fundus photography via iterative multi-modal registration and learning</article-title>. <source>IEEE Trans. Med. Imaging</source> <volume>40</volume>, <fpage>2748</fpage>&#x2013;<lpage>2758</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2020.3027665</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fraz</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Basit</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Barman</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Application of morphological bit planes in retinal blood vessel extraction</article-title>. <source>J. digital imaging</source> <volume>26</volume>, <fpage>274</fpage>&#x2013;<lpage>286</lpage>. <pub-id pub-id-type="doi">10.1007/s10278-012-9513-3</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Fu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kee Wong</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2016</year>). &#x201c;<article-title>Deepvessel: retinal vessel segmentation via deep learning and conditional random field</article-title>,&#x201d; in <conf-name>Medical Image Computing and Computer-Assisted Intervention&#x2013;MICCAI 2016: 19th International Conference</conf-name>, <conf-loc>Athens, Greece</conf-loc>, <conf-date>October 17-21, 2016</conf-date> (<publisher-name>Springer</publisher-name>), <fpage>132</fpage>&#x2013;<lpage>139</lpage>.</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gibson</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Giganti</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Bonmati</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Bandula</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gurusamy</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Automatic multi-organ segmentation on abdominal ct with dense v-networks</article-title>. <source>IEEE Trans. Med. imaging</source> <volume>37</volume>, <fpage>1822</fpage>&#x2013;<lpage>1834</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2018.2806309</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Hao</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Ce-net: context encoder network for 2d medical image segmentation</article-title>. <source>IEEE Trans. Med. imaging</source> <volume>38</volume>, <fpage>2281</fpage>&#x2013;<lpage>2292</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2019.2903562</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Jian</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>G.-G.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Convunext: an efficient convolution neural network for medical image segmentation</article-title>. <source>Knowledge-Based Syst.</source> <volume>253</volume>, <fpage>109512</fpage>. <pub-id pub-id-type="doi">10.1016/j.knosys.2022.109512</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>He</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2016</year>). &#x201c;<article-title>Deep residual learning for image recognition</article-title>,&#x201d; in <conf-name>Proceedings of the IEEE conference on computer vision and pattern recognition</conf-name>, <conf-loc>USA</conf-loc>, <conf-date>July 26 2017</conf-date>, <fpage>770</fpage>&#x2013;<lpage>778</lpage>.</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Imani</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Javidi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pourreza</surname>
<given-names>H.-R.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Improvement of retinal blood vessel detection using morphological component analysis</article-title>. <source>Comput. methods programs Biomed.</source> <volume>118</volume>, <fpage>263</fpage>&#x2013;<lpage>279</lpage>. <pub-id pub-id-type="doi">10.1016/j.cmpb.2015.01.004</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ju</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Bonnington</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Drummond</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Leveraging regular fundus images for training uwf fundus diagnosis models via adversarial learning and pseudo-labeling</article-title>. <source>IEEE Trans. Med. Imaging</source> <volume>40</volume>, <fpage>2911</fpage>&#x2013;<lpage>2925</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2021.3056395</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kamnitsas</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Ledig</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Newcombe</surname>
<given-names>V. F.</given-names>
</name>
<name>
<surname>Simpson</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Kane</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Menon</surname>
<given-names>D. K.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Efficient multi-scale 3d cnn with fully connected crf for accurate brain lesion segmentation</article-title>. <source>Med. image Anal.</source> <volume>36</volume>, <fpage>61</fpage>&#x2013;<lpage>78</lpage>. <pub-id pub-id-type="doi">10.1016/j.media.2016.10.004</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Kumar</surname>
<given-names>S. J. J.</given-names>
</name>
<name>
<surname>Ravichandran</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>Morphological operation detection of retinal image segmentation</article-title>,&#x201d; in <conf-name>2017 International Conference on Intelligent Sustainable Systems (ICISS)</conf-name>, <conf-loc>USA</conf-loc>, <conf-date>7-8 Dec. 2017</conf-date> (<publisher-name>IEEE</publisher-name>), <fpage>1228</fpage>&#x2013;<lpage>1235</lpage>.</citation>
</ref>
<ref id="B18">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Hao</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Qiao</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). &#x201c;<article-title>Privileged modality guided network for retinal vessel segmentation in ultra-wide-field images</article-title>,&#x201d; in <source>International workshop on ophthalmic medical image analysis</source> (<publisher-name>Springer</publisher-name>), <fpage>82</fpage>&#x2013;<lpage>91</lpage>.</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Teng</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A new ultra-wide-field fundus dataset to diabetic retinopathy grading using hybrid preprocessing methods</article-title>. <source>Comput. Biol. Med.</source> <volume>157</volume>, <fpage>106750</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.106750</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Long</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Shelhamer</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Darrell</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2015</year>). &#x201c;<article-title>Fully convolutional networks for semantic segmentation</article-title>,&#x201d; in <conf-name>Proceedings of the IEEE conference on computer vision and pattern recognition</conf-name>, <conf-loc>USA</conf-loc>, <conf-date>7-8 Dec. 2017</conf-date>, <fpage>3431</fpage>&#x2013;<lpage>3440</lpage>.</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Memari</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Ramli</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Bin Saripan</surname>
<given-names>M. I.</given-names>
</name>
<name>
<surname>Mashohor</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Moghbel</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Supervised retinal vessel segmentation from color fundus images based on matched filtering and adaboost classifier</article-title>. <source>PloS one</source> <volume>12</volume>, <fpage>e0188939</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0188939</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mou</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Cs2-net: deep learning segmentation of curvilinear structures in medical imaging</article-title>. <source>Med. image Anal.</source> <volume>67</volume>, <fpage>101874</fpage>. <pub-id pub-id-type="doi">10.1016/j.media.2020.101874</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nguyen</surname>
<given-names>T. D.</given-names>
</name>
<name>
<surname>Le</surname>
<given-names>D.-T.</given-names>
</name>
<name>
<surname>Bum</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Choo</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Retinal disease diagnosis using deep learning on ultra-wide-field fundus images</article-title>. <source>Diagnostics</source> <volume>14</volume>, <fpage>105</fpage>. <pub-id pub-id-type="doi">10.3390/diagnostics14010105</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oliveira</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pereira</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Silva</surname>
<given-names>C. A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Retinal vessel segmentation based on fully convolutional neural networks</article-title>. <source>Expert Syst. Appl.</source> <volume>112</volume>, <fpage>229</fpage>&#x2013;<lpage>242</lpage>. <pub-id pub-id-type="doi">10.1016/j.eswa.2018.06.034</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Ong</surname>
<given-names>I. S. Y.</given-names>
</name>
<name>
<surname>Lim</surname>
<given-names>L. T.</given-names>
</name>
<name>
<surname>Mahmood</surname>
<given-names>M. H.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>N. K.</given-names>
</name>
</person-group> (<year>2023</year>). &#x201c;<article-title>U-net segmentation of ultra-widefield retinal fundus images for retinal vein occlusion associated lesion recognition</article-title>,&#x201d; in <conf-name>2023 IEEE International Conference on Artificial Intelligence in Engineering and Technology (IICAIET) (IEEE)</conf-name>, <conf-loc>China</conf-loc>, <conf-date>12-14 Sept. 2023</conf-date>, <fpage>106</fpage>&#x2013;<lpage>111</lpage>. <pub-id pub-id-type="doi">10.1109/iicaiet59451.2023.10291722</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Orlando</surname>
<given-names>J. I.</given-names>
</name>
<name>
<surname>Prokofyeva</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Blaschko</surname>
<given-names>M. B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>A discriminatively trained fully connected conditional random field model for blood vessel segmentation in fundus images</article-title>. <source>IEEE Trans. Biomed. Eng.</source> <volume>64</volume>, <fpage>16</fpage>&#x2013;<lpage>27</lpage>. <pub-id pub-id-type="doi">10.1109/TBME.2016.2535311</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Perone</surname>
<given-names>C. S.</given-names>
</name>
<name>
<surname>Cohen-Adad</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2018</year>). &#x201c;<article-title>Deep semi-supervised segmentation with weight-averaged consistency targets</article-title>,&#x201d; in <source>International workshop on deep learning in medical image analysis</source> (<publisher-name>Springer</publisher-name>), <fpage>12</fpage>&#x2013;<lpage>19</lpage>.</citation>
</ref>
<ref id="B28">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Ronneberger</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Fischer</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Brox</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2015</year>). &#x201c;<article-title>U-net: convolutional networks for biomedical image segmentation</article-title>,&#x201d; in <conf-name>Medical image computing and computer-assisted intervention&#x2013;MICCAI 2015: 18th international conference, Munich</conf-name>, <conf-loc>Germany</conf-loc>, <conf-date>October 5-9, 2015</conf-date> (<publisher-name>Springer</publisher-name>), <fpage>234</fpage>&#x2013;<lpage>241</lpage>.</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ryu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Rehman</surname>
<given-names>M. U.</given-names>
</name>
<name>
<surname>Nizami</surname>
<given-names>I. F.</given-names>
</name>
<name>
<surname>Chong</surname>
<given-names>K. T.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Segr-net: a deep learning framework with multi-scale feature fusion for robust retinal vessel segmentation</article-title>. <source>Comput. Biol. Med.</source> <volume>163</volume>, <fpage>107132</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.107132</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seeb&#xf6;ck</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Orlando</surname>
<given-names>J. I.</given-names>
</name>
<name>
<surname>Schlegl</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Waldstein</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Bogunovi&#x107;</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Klimscha</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Exploiting epistemic uncertainty of anatomy segmentation for anomaly detection in retinal oct</article-title>. <source>IEEE Trans. Med. imaging</source> <volume>39</volume>, <fpage>87</fpage>&#x2013;<lpage>98</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2019.2919951</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Selvaraju</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Cogswell</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Das</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Vedantam</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Parikh</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Batra</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>Grad-cam: visual explanations from deep networks via gradient-based localization</article-title>,&#x201d; in <conf-name>Proceedings of the IEEE international conference on computer vision</conf-name>, <conf-loc>USA</conf-loc>, <conf-date>13-16 Oct. 2003</conf-date>, <fpage>618</fpage>&#x2013;<lpage>626</lpage>. <pub-id pub-id-type="doi">10.1109/iccv.2017.74</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Soares</surname>
<given-names>J. V.</given-names>
</name>
<name>
<surname>Leandro</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>Cesar</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Jelinek</surname>
<given-names>H. F.</given-names>
</name>
<name>
<surname>Cree</surname>
<given-names>M. J.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Retinal vessel segmentation using the 2-d gabor wavelet and supervised classification</article-title>. <source>IEEE Trans. Med. Imaging</source> <volume>25</volume>, <fpage>1214</fpage>&#x2013;<lpage>1222</lpage>. <pub-id pub-id-type="doi">10.1109/tmi.2006.879967</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname>
<given-names>Q.-Q.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>X.-G.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.-Q.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>D.-W.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>M.-X.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Applications of deep learning for detecting ophthalmic diseases with ultrawide-field fundus images</article-title>. <source>Int. J. Ophthalmol.</source> <volume>17</volume>, <fpage>188</fpage>&#x2013;<lpage>200</lpage>. <pub-id pub-id-type="doi">10.18240/ijo.2024.01.24</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tavakkoli</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kamran</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Hossain</surname>
<given-names>K. F.</given-names>
</name>
<name>
<surname>Zuckerbrod</surname>
<given-names>S. L.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A novel deep learning conditional generative adversarial network for producing angiography images from retinal fundus photographs</article-title>. <source>Sci. Rep.</source> <volume>10</volume>, <fpage>21580</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-020-78696-2</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wan</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>A new segmentation algorithm for peripapillary atrophy and optic disk from ultra-widefield photographs</article-title>. <source>Comput. Biol. Med.</source> <volume>172</volume>, <fpage>108281</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2024.108281</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wan</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Old photo restoration via deep latent space translation</article-title>. <source>IEEE Trans. Pattern Analysis Mach. Intell.</source> <volume>45</volume>, <fpage>2071</fpage>&#x2013;<lpage>2087</lpage>. <pub-id pub-id-type="doi">10.1109/TPAMI.2022.3163183</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Xin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). &#x201c;<article-title>Advancing uwf-slo vessel segmentation with source-free active domain adaptation and a novel multi-center dataset</article-title>,&#x201d; in <conf-name>International Conference on Medical Image Computing and Computer-Assisted Intervention</conf-name>, <conf-loc>China</conf-loc>, <conf-date>03 October 2024</conf-date> (<publisher-name>Springer</publisher-name>), <fpage>75</fpage>&#x2013;<lpage>85</lpage>.</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Querying labeled for unlabeled: cross-image semantic consistency guided semi-supervised semantic segmentation</article-title>. <source>IEEE Trans. Pattern Analysis Mach. Intell.</source> <volume>45</volume>, <fpage>8827</fpage>&#x2013;<lpage>8844</lpage>. <pub-id pub-id-type="doi">10.1109/TPAMI.2022.3233584</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Automatic segmentation of hemorrhages in the ultra-wide field retina: multi-scale attention subtraction networks and an ultra-wide field retinal hemorrhage dataset</article-title>. <source>IEEE J. Biomed. Health Inf.</source> <volume>28</volume>, <fpage>7369</fpage>&#x2013;<lpage>7381</lpage>. <pub-id pub-id-type="doi">10.1109/JBHI.2024.3457512</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2018</year>). &#x201c;<article-title>Multiscale network followed network model for retinal vessel segmentation</article-title>,&#x201d; in <conf-name>Medical Image Computing and Computer Assisted Intervention&#x2013;MICCAI 2018: 21st International Conference</conf-name>, <conf-loc>Granada, Spain</conf-loc>, <conf-date>September 16-20, 2018</conf-date> (<publisher-name>Springer</publisher-name>), <fpage>119</fpage>&#x2013;<lpage>126</lpage>.</citation>
</ref>
<ref id="B41">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Xiao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Lian</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2018</year>). &#x201c;<article-title>Weighted res-unet for high-quality retina vessel segmentation</article-title>,&#x201d; in <conf-name>2018 9th international conference on information technology in medicine and education (ITME)</conf-name>, <conf-loc>Spain</conf-loc>, <conf-date>September 16-20, 2018</conf-date> (<publisher-name>IEEE</publisher-name>), <fpage>327</fpage>&#x2013;<lpage>331</lpage>.</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>K.-T.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>A three-stage deep learning model for accurate retinal vessel segmentation</article-title>. <source>IEEE J. Biomed. Health Inf.</source> <volume>23</volume>, <fpage>1427</fpage>&#x2013;<lpage>1436</lpage>. <pub-id pub-id-type="doi">10.1109/JBHI.2018.2872813</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>W.-H.</given-names>
</name>
<name>
<surname>Shao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.-W.</given-names>
</name>
</person-group>, (<year>2023</year>). <article-title>Guidelines on clinical research evaluation of artificial intelligence in ophthalmology (2023)</article-title>. <source>Int. J. Ophthalmol.</source> <volume>16</volume>, <fpage>1361</fpage>&#x2013;<lpage>1372</lpage>. <pub-id pub-id-type="doi">10.18240/ijo.2023.09.02</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Adel</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bourennane</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Retinal vessel segmentation using a probabilistic tracking method</article-title>. <source>Pattern Recognit.</source> <volume>45</volume>, <fpage>1235</fpage>&#x2013;<lpage>1244</lpage>. <pub-id pub-id-type="doi">10.1016/j.patcog.2011.09.019</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Dashtbozorg</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Bekkers</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Pluim</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Duits</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>ter Haar Romeny</surname>
<given-names>B. M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Robust retinal vessel segmentation via locally adaptive derivative frames in orientation scores</article-title>. <source>IEEE Trans. Med. imaging</source> <volume>35</volume>, <fpage>2631</fpage>&#x2013;<lpage>2644</lpage>. <pub-id pub-id-type="doi">10.1109/TMI.2016.2587062</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Deepuwf-plus: automatic fundus identification and diagnosis system based on ultrawide-field fundus imaging</article-title>. <source>Appl. Intell.</source> <volume>51</volume>, <fpage>7533</fpage>&#x2013;<lpage>7551</lpage>. <pub-id pub-id-type="doi">10.1007/s10489-021-02242-4</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>J.-Y.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Isola</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Efros</surname>
<given-names>A. A.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>Unpaired image-to-image translation using cycle-consistent adversarial networks</article-title>,&#x201d; in <conf-name>Proceedings of the IEEE international conference on computer vision</conf-name>, <conf-loc>USA</conf-loc>, <conf-date>06 August 2002</conf-date>, <fpage>2223</fpage>&#x2013;<lpage>2232</lpage>.</citation>
</ref>
</ref-list>
</back>
</article>