<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="methods-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2021.775433</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Marine Science</subject>
<subj-group>
<subject>Methods</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A Deep Learning Model to Recognize and Quantitatively Analyze Cold Seep Substrates and the Dominant Associated Species</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Haining</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1472686/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Fu</surname> <given-names>Xiaoxue</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1495895/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhao</surname> <given-names>Chengqian</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Luan</surname> <given-names>Zhendong</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Li</surname> <given-names>Chaolun</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/785713/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Key Laboratory of Marine Ecology and Environmental Sciences, Institute of Oceanology, Chinese Academy of Sciences</institution>, <addr-line>Qingdao</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>University of Chinese Academy of Sciences</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>Deep Sea Research Center, Institute of Oceanology, Chinese Academy of Sciences</institution>, <addr-line>Qingdao</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>Artificial Intelligence Lab, Qingdao University of Science and Technology</institution>, <addr-line>Qingdao</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>School of Information Science and Technology, Fudan University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff6"><sup>6</sup><institution>Center for Ocean Mega-Science, Chinese Academy of Sciences</institution>, <addr-line>Qingdao</addr-line>, <country>China</country></aff>
<aff id="aff7"><sup>7</sup><institution>Key Laboratory of Marine Geology and Environment, Institute of Oceanology, Chinese Academy of Sciences</institution>, <addr-line>Qingdao</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Corrado Costa, Council for Agricultural and Economics Research (CREA), Italy</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Luciano Ortenzi, Council for Agricultural and Economics Research (CREA), Italy; Xikun Song, Xiamen University, China</p></fn>
<corresp id="c001">&#x002A;Correspondence: Chaolun Li, <email>lcl@qdio.ac.cn</email></corresp>
<fn fn-type="other" id="fn004"><p>This article was submitted to Deep-Sea Environments and Ecology, a section of the journal Frontiers in Marine Science</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>25</day>
<month>11</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>8</volume>
<elocation-id>775433</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>09</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>29</day>
<month>10</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2021 Wang, Fu, Zhao, Luan and Li.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Wang, Fu, Zhao, Luan and Li</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Characterizing habitats and species distribution is important to understand the structure and function of cold seep ecosystems. This paper develops a deep learning model for the fast and accurate recognition and classification of substrates and the dominant associated species in cold seeps. Considering the dense distribution of the dominant associated species and small objects caused by overlap in cold seeps, the feature pyramid network (FPN) embed into the faster region-convolutional neural network (R-CNN) was used to detect large-scale changes and small missing objects without increasing the number of calculations. We applied three classifiers (Faster R-CNN + FPN for mussel beds, lobster clusters and biological mixing, CNN for shell debris and exposed authigenic carbonates, and VGG16 for reduced sediments and muddy bottom) to improve the recognition accuracy of substrates. The model&#x2019;s results were manually verified using images obtained in the Formosa cold seep during a 2016 cruise. The recognition accuracy of the two dominant species, e.g., <italic>Gigantidas platifrons</italic> and Munidopsidae could be 70.85 and 56.16%, respectively. Seven subcategories of substrates were also classified with a mean accuracy of 74.87%. The developed model is a promising tool for the fast and accurate characterization of substrates and epifauna in cold seeps, which is crucial for large-scale quantitative analyses.</p>
</abstract>
<kwd-group>
<kwd>cold seep</kwd>
<kwd>substrates</kwd>
<kwd>epifauna</kwd>
<kwd>Faster R-CNN</kwd>
<kwd>FPN</kwd>
<kwd>VGG16</kwd>
</kwd-group>
<counts>
<fig-count count="9"/>
<table-count count="5"/>
<equation-count count="7"/>
<ref-count count="30"/>
<page-count count="11"/>
<word-count count="6632"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="S1">
<title>Introduction</title>
<p>Cold seeps have been documented throughout global oceans along both active and passive continental margins (<xref ref-type="bibr" rid="B26">Sibuet and Olu, 1998</xref>). The fluids are enriched with reduced compounds from seabed support in distinctive chemoautotrophic ecosystems (<xref ref-type="bibr" rid="B3">Brooks et al., 1984</xref>; <xref ref-type="bibr" rid="B14">Kennicutt et al., 1988</xref>). Since their discovery in the Gulf of Mexico in 1983 (<xref ref-type="bibr" rid="B21">Paull et al., 1984</xref>), cold seep ecosystems have become &#x201C;hotspots&#x201D; of deep sea research due to the special lifestyles of animals, unique adaptations to extreme environments, and important roles in global geochemical cycles (<xref ref-type="bibr" rid="B6">Cordes et al., 2009</xref>; <xref ref-type="bibr" rid="B13">Joye, 2020</xref>). Most active cold seeps are generally characterized with a vast biomass but low diversity and are dominated by large symbiont-bearing invertebrates (<xref ref-type="bibr" rid="B20">Menot et al., 2010</xref>). These invertebrates are considered the ecosystem engineers and influence the sediment environment, provide physical structure and modulate geochemistry through oxygenation (pumping) and ion uptake activities (<xref ref-type="bibr" rid="B15">Levin, 2005</xref>). To understand the structure and function of cold seep ecosystems, it is essential to comprehensively describe the distribution of the major habitats and epifauna. However, the topography of cold seep areas is usually complex and heterogeneous. Additionally, the epifauna present a patchy distribution as influenced by discontinued and scattered seep points. It is difficult to obtain complete and comprehensive community information in a traditional way (physical collection, such as epibenthic sled, grab, etc.) due to the region&#x2019;s high randomness and low representation (<xref ref-type="bibr" rid="B16">Levin et al., 2000</xref>). Alternatively, <xref ref-type="bibr" rid="B25">Sen et al. (2016)</xref> used multibeam backscatter and bathymetry to obtain complete data for cold seeps. Improved camera (<xref ref-type="bibr" rid="B19">MacDonald et al., 2003</xref>; <xref ref-type="bibr" rid="B11">Hsu et al., 2018</xref>; <xref ref-type="bibr" rid="B24">Sen et al., 2019</xref>) and video technologies (<xref ref-type="bibr" rid="B25">Sen et al., 2016</xref>) were also applied, but the subsequent data processing was time-consuming and laborious.</p>
<p>Deep learning is considered one of the major breakthroughs in the artificial intelligence over the past decade and has been widely used in multiple fields including image analysis, target detection, and computer version (<xref ref-type="bibr" rid="B10">Han et al., 2020</xref>). This method can be divided into three steps. First, the deep neural network is used to automatically extract features from the target. Then, the model is trained using manually annotated datasets. Finally, the trained model is used to identify the target. Compared with error-prone human performances, deep learning has the unique capability of reducing time and workloads while providing higher reliabilities and accuracies (<xref ref-type="bibr" rid="B22">Raphael et al., 2020</xref>). Major deep learning models include convolutional neural networks (CNN; <xref ref-type="bibr" rid="B2">Albawi et al., 2017</xref>), recurrent (<xref ref-type="bibr" rid="B5">Cho et al., 2014</xref>) and recursive neural networks (<xref ref-type="bibr" rid="B9">Goodfellow et al., 2016</xref>), and generative adversarial networks (<xref ref-type="bibr" rid="B7">Creswell et al., 2018</xref>). The CNN uses convolutions (special linear operations) in at least one layer of the network instead of typical matrix multiplication operations, which is to process data with grid-like structures. Recurrent neural networks are used to process sequential data and can learn nonlinear features of sequences with high efficiencies. The potential use of recurrent neural networks for learning inferences has been successfully applied to networks with data structure inputs. Generative adversarial networks are based on microgenerators and solve problems by learning new samples from the training set. Generative adversarial networks are based on a game theory scenario in which generators must compete with adversaries (discriminators).</p>
<p>With the development of deep learning, an increasing number of target detection and recognition method have been applied to marine research. The CNN is an efficient deep learning model that can be used to extract profile feature information as it can reduce the network structure complexity as well as the number of parameters through local receptive fields, weight sharing, and pooling operations, while also actively extracting high-dimensional features from big data (<xref ref-type="bibr" rid="B4">Chen et al., 2021</xref>). CNN image processing was customized by <xref ref-type="bibr" rid="B30">Zuazo et al. (2020)</xref> to extract biological information of the bubblegum coral <italic>Paragorgia arborea</italic> from times series. <xref ref-type="bibr" rid="B8">Elawady (2015)</xref> used a CNN to classify deep-sea coral reefs, which could achieve autonomous coral repairing combined with autonomous underwater vehicles. The Fast R-CNN was applied by <xref ref-type="bibr" rid="B12">Huang et al. (2019)</xref> to detect and identify marine organisms with three data augmentation methods expanded a small number of samples. <xref ref-type="bibr" rid="B18">Lu et al. (2017)</xref> used the &#x201C;You Only Look Once: YOLO&#x201D; approach to recognize and track marine organisms including shrimp, squid, crab and shark. While each of these methods has certain advantages, they show weakness for small-sized target identification and accuracies in cold seeps due to the high habitat heterogeneity caused by complex carbonate rocks and dense organism collections. To adapt to the special environment of cold seeps, it is necessary to develop a new algorithm for substrates and epifauna recognition.</p>
<p>When performing multi-scale target detection, traditional algorithms generally use reduced or expanded images as inputs to generate feature combinations that reflect features at different scales (<xref ref-type="bibr" rid="B1">Adelson et al., 1983</xref>). The mainstream deep learning networks currently adopt a single high-level feature for detection. However, the reduced pixel information in small targets make them easily lost in the down-sampling processing. The dominant associated species in cold seeps are relatively smaller in size with a greater community density. Embedding the feature pyramid network (FPN; <xref ref-type="bibr" rid="B17">Lin et al., 2017</xref>) structure into the Faster R-CNN (<xref ref-type="bibr" rid="B23">Ren et al., 2015</xref>) is a potential solution to improve the detection of small and medium-sized targets.</p>
<p>This paper develops a model to accurately identify substrates and the dominant associated species in cold seeps. Image of the Formosa cold seep collected in the South China Sea were used to train and verify the model.</p>
</sec>
<sec id="S2">
<title>Model Building</title>
<sec id="S2.SS1">
<title>Image Collection and Data Set Production</title>
<p>An imaging and laser profiling system mounted on a remotely operated vehicle (ROV) was used to collect a series of adjacent images with geographic coordinates by the R.V. <italic>Kexue</italic> in 2016. ROV traveled at a speed of 1.5&#x2013;2 knots and 2&#x2013;3 meters above the seabed. Nine images per second was shot and these images can distinguish individuals larger than 1 cm. Geographic coordinates and the same object identifier in adjacent images were used to splice an initial mosaic. The mosaic color was finally uniformed to produce the Mosaic (<xref ref-type="fig" rid="F1">Figure 1A</xref>). For the subsequent training experimental data set and model verification, the Mosaic was divided into 19,516 small images (cut by 200 &#x00D7; 200 and removing blank images). The upper part of the Mosaic was manually tagged for the data set and the other parts were used for the model verification experiment. Tagging targets (<xref ref-type="fig" rid="F1">Figure 1</xref>) primarily includes: (1) the dominant associated species [<italic>Gigantidas platifrons</italic> (<italic>G</italic>. <italic>platifrons</italic>) and Munidopsidae], (2) hard substrates (mussel beds, lobster clusters, biological mixing, shell debris, and exposed authigenic carbonates) and soft substrates (reduced sediments and muddy bottom). The classification of substrates is specified in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p><bold>(A)</bold> Mosaic (20,000 m<sup>2</sup>) of Formosa ridge cold seep from 2016. The outline represents the area where images were obtained and the red frame is the training set. The hard substrates are: <bold>(B)</bold> mussel beds, <bold>(C)</bold> lobster clusters, <bold>(D)</bold> biological mixing, <bold>(E)</bold> shell debris, and <bold>(F)</bold> exposed authigenic carbonates. The soft substrates are the <bold>(G)</bold> reduced sediments and <bold>(H)</bold> muddy bottom. The dominant species in cold seep are <bold>(I)</bold> <italic>Gigantidas platifrons</italic> and <bold>(J)</bold> Munidopsidae.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-08-775433-g001.tif"/>
</fig>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Definitions and descriptions of the two main substrates (seven small classifications).</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left" colspan="2">Substrata classifications</td>
<td valign="top" align="left">Description</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Hard substrates (Carbonate rocks)</td>
<td valign="top" align="left">Mussel beds (B)</td>
<td valign="top" align="left">Large number (&#x003E;50 ind./m<sup>2</sup>) of <italic>G. platifrons</italic> and small number (&#x003C;20 ind./m<sup>2</sup>) of Munidopsidae</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Lobster clusters (C)</td>
<td valign="top" align="left">Large number (&#x003E;50 ind./m<sup>2</sup>) of Munidopsidae and small number (&#x003C;20 ind./m<sup>2</sup>) of <italic>G. platifrons</italic></td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Biological mixing (D)</td>
<td valign="top" align="left">Large number (&#x003E;20 ind./m<sup>2</sup>) of Munidopsidae and <italic>G. platifrons</italic></td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Shell debris (E)</td>
<td valign="top" align="left">Open and empty mussel shells or white shell hash</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Exposed authigenic carbonates (F)</td>
<td valign="top" align="left">Bare and hard authigenic carbonate rocks or boulders, or isolated pieces of carbonate rock surrounded by sediment</td>
</tr>
<tr>
<td valign="top" align="left">Soft substrates</td>
<td valign="top" align="left">Reduced sediments (G)</td>
<td valign="top" align="left">Black or purple stained sediment</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Muddy bottom (H)</td>
<td valign="top" align="left">Significant ordinary argillaceous environment</td>
</tr>
</tbody>
</table></table-wrap>
</sec>
<sec id="S2.SS2">
<title>Model Framework</title>
<sec id="S2.SS2.SSS1">
<title>Faster Region-Convolutional Neural Network + Feature Pyramid Network Algorithm for Epifauna Detection</title>
<p>To find an algorithm suitable to detect cold seep epifauna, we considered two-stage (Faster R-CNN base model and our improved model) and single-stage [including SSD300 (<xref ref-type="bibr" rid="B29">Wang et al., 2017</xref>) and YOLOv3] detection algorithms to test the same epifauna dataset. The results showed that the two-stage detection model performed better for the average precision (<xref ref-type="table" rid="T2">Table 2</xref>). Thus, it was more suitable to detect and count cold seep epifauna. However, two-stage detection models are not suitable for real-time target detection because of their relatively lower speeds over single-stage detection. Compared with the original Faster R-CNN structure and other algorithms, the improved algorithm developed in this paper has a higher detection accuracy. Although the detection time increases, the improvement was acceptable relative to the performance. The Fast R-CNN + FPN model was chosen for the recognition of cold seep substrates and epifauna.</p>
<table-wrap position="float" id="T2">
<label>TABLE 2</label>
<caption><p>The comparison of different models.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Model</td>
<td valign="top" align="center">Density of the dominant associated species (ind./m<sup>2</sup>)</td>
<td valign="top" align="center">Number of images</td>
<td valign="top" align="center">AP</td>
<td valign="top" align="center">Speed/ms</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">SSD300</td>
<td valign="top" align="center">&#x003E;50</td>
<td valign="top" align="center">100</td>
<td valign="top" align="center">&#x003C;0.6</td>
<td valign="top" align="center">102</td>
</tr>
<tr>
<td valign="top" align="left">YOLOv3</td>
<td valign="top" align="center">&#x003E;50</td>
<td valign="top" align="center">100</td>
<td valign="top" align="center">&#x003C;0.6</td>
<td valign="top" align="center">63</td>
</tr>
<tr>
<td valign="top" align="left">Faster R-CNN</td>
<td valign="top" align="center">&#x003E;50</td>
<td valign="top" align="center">100</td>
<td valign="top" align="center">&#x003C;0.7</td>
<td valign="top" align="center">159</td>
</tr>
<tr>
<td valign="top" align="left">Faster R-CNN+FPN</td>
<td valign="top" align="center">&#x003E;50</td>
<td valign="top" align="center">100</td>
<td valign="top" align="center">0.738</td>
<td valign="top" align="center">164</td>
</tr>
</tbody>
</table></table-wrap>
<p>The pyramid form of the CNN used in the FPN effectively generates multi-scale feature expressions under a single image view. The FPN structure was designed with a top-down structure while lateral connections fused the shallow high-resolution feature map with the deep feature map having rich semantic information. Embedding the FPN structure in the Faster R-CNN allowed quickly building a feature pyramid with strong semantic information at all scales that could significantly improve the detection capability of the network for small-scale targets (<xref ref-type="bibr" rid="B17">Lin et al., 2017</xref>). The FPN structure is showed in <xref ref-type="fig" rid="F2">Figure 2</xref>, where bottom-up usually refers to the forward computing process of the backbone; top-down uses nearest-neighbor interpolation for up-sampling on the higher-level feature map which could retain the semantic information of the feature map to the maximum extent; and the lateral connection adjusts the feature dimension with a 1 &#x00D7; 1 convolution to ensure consistent corresponding feature layer dimensions between the bottom-up process and the top-down processes. Then, the 3 &#x00D7; 3 convolution operation was aimed at eliminating the blending effect generated in the feature fusion process.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Structure of the feature pyramid network (FPN) algorithm. Top-down structure was designed in the FPN structure while the lateral connections fused the shallow feature map.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-08-775433-g002.tif"/>
</fig>
<p>Embedding the FPN structure in the Faster R-CNN fused the deep and shallow features, which strengthened the feature expression ability of the network and effectively improved its accuracy for small target detection. In addition, ResNet50 (<xref ref-type="bibr" rid="B28">Szegedy et al., 2017</xref>) was used to replace the VGG16 (<xref ref-type="bibr" rid="B27">Simonyan and Zisserman, 2014</xref>) as the backbone feature extraction network of the Faster R-CNN to further improve the network capabilities.</p>
<p>The network architecture of the improved Faster R-CNN algorithm is shown in <xref ref-type="fig" rid="F3">Figure 3</xref>. The feature fusion maps for different levels as extracted by the FPN were separately fed into the region proposal network (RPN) network. This network generated anchor frames with different aspect ratios based on the different feature map scale sizes and selected the corresponding detection layer for the target. The region of interest (ROI) pooled the corresponding region into a fixed-size feature vector in the feature map based on the position coordinates of the candidate regions.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>Network architecture of the improved Faster region-convolutional neural network (R-CNN) algorithm, which contains the FPN and region proposal network (RPN).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-08-775433-g003.tif"/>
</fig>
<p>We set a binary label for each anchor to judge whether it was a target or not to train the RPN. We set a binary label for each anchor to judge whether it was a target or not: we set a positive label for all anchors whose intersection over union (IOU) was greater than or equal to 0.7. We then set a negative labor for all anchors with IOU less than 0.3 for the real box. The loss function of a single image is defined as:</p>
<disp-formula id="S2.Ex1">
<mml:math id="M1" display="block">
<mml:mrow>
<mml:mrow>
<mml:mtext mathvariant="bold-italic">L</mml:mtext>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:msub>
<mml:mtext mathvariant="bold-italic">P</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo>}</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:msub>
<mml:mtext mathvariant="bold-italic">t</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo>}</mml:mo>
</mml:mrow>
<mml:mo rspace="0.8pt">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo rspace="0.8pt">=</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mfrac>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:msub>
<mml:mtext mathvariant="bold-italic">N</mml:mtext>
<mml:mi mathvariant="bold-italic">cls</mml:mi>
</mml:msub>
</mml:mfrac>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:munder>
<mml:mo largeop="true" movablelimits="false" symmetric="true">&#x2211;</mml:mo>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:munder>
<mml:mrow>
<mml:msub>
<mml:mtext mathvariant="bold-italic">L</mml:mtext>
<mml:mi mathvariant="bold-italic">cls</mml:mi>
</mml:msub>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mtext mathvariant="bold-italic">P</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mtext mathvariant="bold-italic">P</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x002A;</mml:mo>
</mml:msubsup>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold">&#x03BB;</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mfrac>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:msub>
<mml:mtext mathvariant="bold-italic">N</mml:mtext>
<mml:mi mathvariant="bold-italic">reg</mml:mi>
</mml:msub>
</mml:mfrac>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:munder>
<mml:mo largeop="true" movablelimits="false" symmetric="true">&#x2211;</mml:mo>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:munder>
<mml:mrow>
<mml:msubsup>
<mml:mtext mathvariant="bold-italic">P</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x002A;</mml:mo>
</mml:msubsup>
<mml:mo>&#x2062;</mml:mo>
<mml:msub>
<mml:mtext mathvariant="bold-italic">L</mml:mtext>
<mml:mi mathvariant="bold-italic">reg</mml:mi>
</mml:msub>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mtext mathvariant="bold-italic">t</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo rspace="7.5pt">,</mml:mo>
<mml:msubsup>
<mml:mtext mathvariant="bold-italic">t</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x002A;</mml:mo>
</mml:msubsup>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>i</italic> is the index of the candidate box in a batch of data, <italic>P</italic><sub><italic>i</italic></sub> is the prediction probability of the <italic>i</italic> th candidate box as the target. If the candidate box is positive, the real label <italic>P</italic><sub><italic>i</italic></sub> = 1; otherwise, <inline-formula><mml:math id="INEQ2"><mml:mrow><mml:mpadded width="+3.3pt"><mml:msubsup><mml:mi>P</mml:mi><mml:mi>i</mml:mi><mml:mo>&#x002A;</mml:mo></mml:msubsup></mml:mpadded><mml:mo rspace="5.8pt">=</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:math></inline-formula>. The &#x03BB; is the normalized weight with &#x03BB;=10 set in the experiment, and <italic>t</italic><sub><italic>i</italic></sub> is the four parameterized coordinate vectors of the prediction box and was the real box vector related to positive samples. The <italic>N</italic><sub><italic>cls</italic></sub> is the batch size in the training process, <italic>N</italic><sub><italic>reg</italic></sub> is the number of candidate boxes, and <italic>L</italic><sub><italic>cls</italic></sub> is the binary logarithm loss and defined as:</p>
<disp-formula id="S2.Ex2">
<mml:math id="M2" display="block">
<mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mtext mathvariant="bold-italic">L</mml:mtext>
<mml:mi mathvariant="bold-italic">cls</mml:mi>
</mml:msub>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mtext mathvariant="bold-italic">P</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mtext mathvariant="bold-italic">P</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x002A;</mml:mo>
</mml:msubsup>
<mml:mo rspace="5.8pt">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mrow>
<mml:mo>-</mml:mo>
<mml:mrow>
<mml:mtext mathvariant="bold-italic">ln</mml:mtext>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mtext mathvariant="bold-italic">P</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo>&#x2062;</mml:mo>
<mml:msubsup>
<mml:mtext mathvariant="bold-italic">P</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x002A;</mml:mo>
</mml:msubsup>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:mo>-</mml:mo>
<mml:msubsup>
<mml:mtext mathvariant="bold-italic">P</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x002A;</mml:mo>
</mml:msubsup>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:mo>-</mml:mo>
<mml:msub>
<mml:mtext mathvariant="bold-italic">P</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
<mml:mo>&#x2062;</mml:mo>
<mml:mtext mathvariant="bold-italic">s</mml:mtext>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The <italic>L</italic><sub><italic>reg</italic></sub> is the regression loss function and is defined as:</p>
<disp-formula id="S2.Ex3">
<mml:math id="M3" display="block">
<mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mtext mathvariant="bold-italic">L</mml:mtext>
<mml:mi mathvariant="bold-italic">reg</mml:mi>
</mml:msub>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mtext mathvariant="bold-italic">t</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mtext mathvariant="bold-italic">t</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x002A;</mml:mo>
</mml:msubsup>
<mml:mo rspace="5.8pt">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mrow>
<mml:munder>
<mml:mo largeop="true" movablelimits="false" symmetric="true">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mo stretchy="false">|</mml:mo>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">w</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">h</mml:mi>
<mml:mo stretchy="false">|</mml:mo>
</mml:mrow>
</mml:munder>
<mml:mrow>
<mml:mtext mathvariant="bold-italic">smooth</mml:mtext>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mtext mathvariant="bold-italic">t</mml:mtext>
<mml:mi mathvariant="bold">i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mtext mathvariant="bold">t</mml:mtext>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x002A;</mml:mo>
</mml:msubsup>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where the smooth function is defined as:</p>
<disp-formula id="S2.Ex4">
<mml:math id="M4" display="block">
<mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mtext mathvariant="bold-italic">smooth</mml:mtext>
<mml:mi mathvariant="bold-italic">L1</mml:mi>
</mml:msub>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mo rspace="5.8pt">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mtable displaystyle="true" rowspacing="0pt">
<mml:mtr>
<mml:mtd columnalign="center">
<mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mn mathvariant="bold">0.5</mml:mn>
<mml:mo>&#x2062;</mml:mo>
<mml:msup>
<mml:mtext mathvariant="bold-italic">x</mml:mtext>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msup>
<mml:mo>&#x2062;</mml:mo>
<mml:mstyle displaystyle="false">
<mml:mfrac>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:msup>
<mml:mi mathvariant="normal">&#x03C3;</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msup>
</mml:mfrac>
</mml:mstyle>
</mml:mrow>
<mml:mo rspace="7.5pt">,</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">|</mml:mo>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mo rspace="5.8pt" stretchy="false">|</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo rspace="5.8pt">&#x2264;</mml:mo>
<mml:mstyle displaystyle="false">
<mml:mfrac>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:msup>
<mml:mi mathvariant="normal">&#x03C3;</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msup>
</mml:mfrac>
</mml:mstyle>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="center">
<mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mo>|</mml:mo>
</mml:mrow>
<mml:mo>-</mml:mo>
<mml:mn mathvariant="bold">0.5</mml:mn>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">others</mml:mi>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
<mml:mi/>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>x</italic> is the error of the border prediction and &#x03C3; is used to control the smooth area with a values of 3 in the experiment.</p>
</sec>
<sec id="S2.SS2.SSS2">
<title>Substrates Recognition Algorithm</title>
<p>The complexity of cold seep substrates and the problems of color bias, dark light and blur in underwater images made it difficult to distinguish all substrate categories using a single classifier. This paper adopted an integration strategy to improve the accuracy of recognition and classification accuracies. In the classification, several base classifiers responsible for distinguishing part of the data were connected in series. The undifferentiated data went to the subsequent base classifier to achieve the optimal results in the iteration.</p>
<p>The associated substrate classification model framework is shown in <xref ref-type="fig" rid="F4">Figure 4</xref>. The first classification model was the FPN embedded in the Faster R-CNN to classify and count the biota. The images that did not satisfy the current classification conditions were passed to the next CNN model, which classified the zones of shell debris and exposed authigenic carbonates. Then, the images that did not satisfy these classification conditions continued to the VGG16 model for binary classification which was responsible for identifying the reduced sediment and muddy bottom zones.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Substrate classification model framework with the three classifiers of FPN, convolutional neural network (CNN), and VGG16 to identify the cold seep substrates.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-08-775433-g004.tif"/>
</fig>
<p>The first base of the integrated classifier in the figure consists of the improved Faster R-CNN and FPN from the section &#x201C;Faster R-CNN + FPN Algorithm for Epifauna Detection.&#x201D; The backbone network used for feature extraction in the model, which could greatly improve the feature extraction capability was replaced by VGG16 with ResNet50 as fused with the FPN. The first base classifier was mainly responsible for biota classification. The FPN was embedded into the Faster RCNN to reduce the redundant multi-resolution feature map detection from the original structure based on the realization of feature fusion. Nearest-neighbor upsampling was used to fuse the shallow location and deep semantic information of the network. With only a small increase in computational costs, the detection accuracy of the network for multi-scale targets was greatly improved. Classification and identification allowed counting the epifauna. Then, the zones of the lobster cluster, mussel bed and biological mixing were distinguished using the substrate classification rules.</p>
<p>The second base classifier consisted of the CNN which was aimed primarily at the recognition and classification of the shell debris and carbonate rock zones. This structure could reduce the amount of memory occupied by the deep network, effectively reduce the number of network parameters, and alleviate the overfitting problem of the model. As a supervised multilayer learning neural network, the implicit convolutional and pooling layers were the core modules to realize feature extraction in the CNN. The CNN improved the accuracy of the network through frequent iterative training by minimizing the loss function using the gradient descent method and adjusting the weight parameters in the network layer by layer in reverse (<xref ref-type="bibr" rid="B2">Albawi et al., 2017</xref>). The low hidden layer of the CNN consisted of alternating convolutional and maximum pooling layers, and the high level was a fully connected layer corresponding to the implicit layer and logistic regression classifier of a traditional multilayer perceptron. The input of the first fully-connected layer was a feature map obtained <italic>via</italic> feature extraction from the convolutional and subsampling layers. The final output layer was a classifier for the input image using logistic regression, Softmax regression, or support vector machines. In this paper, a Softmax nonlinear classifier was used to identify and classify the zones of shell debris and exposed authigenic carbonates.</p>
<p>The third base classifier was aimed at the recognition and classification of reduced sediments and muddy bottoms. The VGG16 was composed of five convolutional layers, three fully-connected layers, and an output layer. The layers were separated by a maximum pooling layer and a ReLU activation function for all implicit activation units. On one hand, the convolutional layers with larger kernels could reduce the parameters. On the other hand, these were equivalent to more nonlinear mappings which could increase the expressive power of the network (<xref ref-type="bibr" rid="B27">Simonyan and Zisserman, 2014</xref>). However, the nonlinear classifier Softmax was still used for identification and classification.</p>
</sec>
</sec>
<sec id="S2.SS3">
<title>Model Training and Verification</title>
<sec id="S2.SS3.SSS1">
<title>Epifauna Quantitative Identification Experiments</title>
<p>The Faster R-CNN can be divided into two parts: the RPN and Fast R-CNN network. The former is a recommendation algorithm for candidate boxes (proposal), and the latter is based on the position of the box where the associated categories of objects are calculated. The RPN was trained first, and the Fast R-CNN was trained with the output (proposal) of the RPN. Fast R-CNN was fine-tuned and used to initialize the RPN parameters, which gives an iterative cycle.</p>
<p>The experimental data were 630 images (randomly selected from the upper part of the Mosaic), and the MRLabeler v1.4 software was used for annotation. The model could achieve the best effect when the learning rate was 0.001, the weight decay was set to 0.0004, the anchor scaling multiple was set to (8, 16, 32), and the scaling ratio was (0.5, 1, 2). To avoid overfitting, the impulse gradient was used with impulse of 0.9. The entire experiment was conducted on a Linux CentOS 7 server, and two NVIDIA GeForce GTX 1080ti graphics processing units (GPUs) with 12GB of memory were synchronized. The in-depth learning framework was implemented with tensorflow version 1.11.0 on the GPU. During training, the positive samples were labeled with IOU values greater than 0.7 and negative samples for those less than 0.3. The optimal model was saved after training and used to count the test data set.</p>
<p>The results of each experiment were evaluated using the Recall, Precision and Accuracy (AP). The Recall and Precision are defined as:</p>
<disp-formula id="S2.Ex5">
<mml:math id="M5" display="block">
<mml:mrow>
<mml:mtext mathvariant="bold-italic">Precision</mml:mtext>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mfrac>
<mml:mtext mathvariant="bold-italic">TP</mml:mtext>
<mml:mrow>
<mml:mtext mathvariant="bold-italic">TP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext mathvariant="bold-italic">FP</mml:mtext>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="S2.Ex6">
<mml:math id="M6" display="block">
<mml:mrow>
<mml:mtext mathvariant="bold-italic">Recall</mml:mtext>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mfrac>
<mml:mtext mathvariant="bold-italic">TP</mml:mtext>
<mml:mrow>
<mml:mtext mathvariant="bold-italic">TP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext mathvariant="bold-italic">FN</mml:mtext>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where the definitions of TP, TN, FP, and FN as shown in <xref ref-type="table" rid="T3">Table 3</xref> denotes true-positive, true-negative, false-positive, and false-negative identifications, respectively. The Precision denotes the proportion of all targets predicted to be correct and the Recall denotes the proportion of targets identified by the correct localization to the total number of targets.</p>
<table-wrap position="float" id="T3">
<label>TABLE 3</label>
<caption><p>Obfuscation matrix for specified categories.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Ground truth predictive</td>
<td valign="top" align="center">Positive</td>
<td valign="top" align="center">Negative</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Positive</td>
<td valign="top" align="center">True positive (TP)</td>
<td valign="top" align="center">False negative (FN)</td>
</tr>
<tr>
<td valign="top" align="left">Negative</td>
<td valign="top" align="center">False positive (FP)</td>
<td valign="top" align="center">True negative (TN)</td>
</tr>
</tbody>
</table></table-wrap>
</sec>
<sec id="S2.SS3.SSS2">
<title>Substrate Identification and Classification Experiments</title>
<p>The MRLabeler v1.4 software was used to label the 1,501 images (randomly selected from the upper part of the Mosaic) in the experimental data set. The specific classification of substrates is shown in <xref ref-type="table" rid="T1">Table 1</xref>. A total of 303 images were obtained from the biota data set, including 15 images of lobster clusters, 240 images of mussel beds, and 48 images of biological mixing areas. There were 1,198 images of abiotic areas, including 284 of shell debris areas, 107 of exposed authigenic carbonates, 19 of reduced sediments and 788 of muddy bottoms.</p>
<p>The training parameters were set so the first base classifier was the same as the FPN + Faster R -CNN model in the section &#x201C;Faster R-CNN + FPN Algorithm for Epifauna Detection.&#x201D; In the second and third base classifiers, the convolution kernel was 3 &#x00D7; 3 and the step size was 1. To ensure optimal performance of each classifier, every detector was trained separately.</p>
</sec>
</sec>
<sec id="S2.SS4">
<title>Accuracy Verification Experiment</title>
<p>A total of 6,000 images randomly selected from the remaining parts of the Mosaic were used to test the error in the model. The error mean for epifauna was calculated as:</p>
<disp-formula id="S2.Ex7">
<mml:math id="M7" display="block">
<mml:mrow>
<mml:mtext mathvariant="bold-italic">E</mml:mtext>
<mml:mo rspace="5.8pt">=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mo largeop="true" symmetric="true">&#x2211;</mml:mo>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mi mathvariant="bold-italic">n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">|</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mi mathvariant="bold-italic">ir</mml:mi>
</mml:msub>
<mml:mo>-</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mi mathvariant="bold-italic">in</mml:mi>
</mml:msub>
</mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mi mathvariant="bold-italic">in</mml:mi>
</mml:msub>
</mml:mfrac>
<mml:mo stretchy="false">|</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mtext mathvariant="bold-italic">n</mml:mtext>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>i</italic> is the image index, <italic>n</italic> is the number of images, and <italic>x</italic><sub><italic>ir</italic></sub> and <italic>x</italic><sub><italic>in</italic></sub> are the number of epifauna in the images identified by the model and manually counted, respectively. The error mean of the substrates is determined by whether the substrate is correctly identified. The Surfer software was used to show the distribution of substrates and epifauna.</p>
</sec>
</sec>
<sec id="S3">
<title>Training and Verification Results and Discussion</title>
<sec id="S3.SS1">
<title>Model Training Results</title>
<p>The results show that the Recall, Precision and AP of the Munidopsidae were all greater than the <italic>G. platifrons</italic> (<xref ref-type="table" rid="T4">Table 4</xref>). The experimental model training achieved a mean average precision of 73.8% on the epifauna dataset, and the recognition accuracy of <italic>G. platifrons</italic> and Munidopsidae were 72.0 and 75.6%, respectively. The experimental results are visualized in <xref ref-type="fig" rid="F5">Figure 5</xref>. The experiments indicate that the improved algorithm greatly enhances the accuracy of recognition and counting of cold seep epifauna over other existing methods (<xref ref-type="table" rid="T2">Table 2</xref>).</p>
<table-wrap position="float" id="T4">
<label>TABLE 4</label>
<caption><p>Experimental results of the dominant associated species.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Folds</td>
<td valign="top" align="center">Recall</td>
<td valign="top" align="center">Precision</td>
<td valign="top" align="center">AP</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><italic>G</italic>. <italic>platifrons</italic></td>
<td valign="top" align="center">0.745</td>
<td valign="top" align="center">0.719</td>
<td valign="top" align="center">0.720</td>
</tr>
<tr>
<td valign="top" align="left">Munidopsidae</td>
<td valign="top" align="center">0.876</td>
<td valign="top" align="center">0.755</td>
<td valign="top" align="center">0.756</td>
</tr>
</tbody>
</table></table-wrap>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Recognition results for <italic>G</italic>. <italic>platifrons</italic> and Munidopsidae as represented as green and pink frames, respectively.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-08-775433-g005.tif"/>
</fig>
<p>The accuracy of the ensemble classifier was more than 80% (<xref ref-type="table" rid="T5">Table 5</xref>), and the soft substrates (reduced sediment and muddy bottom) had relatively higher accuracies than hard substrates. Thus, the accuracy of cold seep substrate classification could be greatly improved using the proposed algorithm.</p>
<table-wrap position="float" id="T5">
<label>TABLE 5</label>
<caption><p>Experimental results of the substrates on the test set where (B) to (H) represent the different substrates defined in <xref ref-type="table" rid="T1">Table 1</xref>.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Category</td>
<td valign="top" align="center"><italic>n</italic></td>
<td valign="top" align="center">FPN false detection</td>
<td valign="top" align="center">CNN false detection</td>
<td valign="top" align="center">VGG16 false detection</td>
<td valign="top" align="center">Total number of false checks</td>
<td valign="top" align="center">Accuracy</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">B</td>
<td valign="top" align="center">240</td>
<td valign="top" align="center">&#x2013;</td>
<td/>
<td/>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x003E;0.8</td>
</tr>
<tr>
<td valign="top" align="left">C</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">&#x2013;</td>
<td/>
<td/>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x003E;0.8</td>
</tr>
<tr>
<td valign="top" align="left">D</td>
<td valign="top" align="center">48</td>
<td valign="top" align="center">8</td>
<td/>
<td/>
<td valign="top" align="center">8</td>
<td valign="top" align="center">0.83</td>
</tr>
<tr>
<td valign="top" align="left">E</td>
<td valign="top" align="center">284</td>
<td valign="top" align="center">14</td>
<td valign="top" align="center">34</td>
<td/>
<td valign="top" align="center">48</td>
<td valign="top" align="center">0.83</td>
</tr>
<tr>
<td valign="top" align="left">F</td>
<td valign="top" align="center">107</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">13</td>
<td/>
<td valign="top" align="center">13</td>
<td valign="top" align="center">0.87</td>
</tr>
<tr>
<td valign="top" align="left">G</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">0.89</td>
</tr>
<tr>
<td valign="top" align="left">H</td>
<td valign="top" align="center">788</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">0.97</td>
</tr>
</tbody>
</table></table-wrap>
</sec>
<sec id="S3.SS2">
<title>Model Verification Results</title>
<p>The FPN structure embed into the Faster R-CNN was well adapted to the identification difficulties caused by the particularity of cold seeps. Although single-stage detection algorithms have relatively fast speeds compared with two-stage approaches, these are not suitable for the detection and counting of cold seep epifauna due to the lower average precision. The dominant species (<italic>G. platifrons</italic> and Munidopsidae) were the main objects of interest. The recognition results indicate that this model weas helpful to detect cold seep epifauna (<italic>G. platifrons</italic> and Munidopsidae) with a relatively high recognition accuracy (<xref ref-type="fig" rid="F5">Figure 5</xref>). Our study showed that the recognition errors of <italic>G. platifrons</italic> were lower than Munidopsidae with a range of 0 to 300% and a mean of 29.15%. The recognition errors for Munidopsidae were higher with a range of 0 to 1,650% and a mean of 43.84%. Without calculating the limited epifauna areas, the error means of the two species reached 26.88 and 39.11%, respectively. The different error ranges of <italic>G. platifrons</italic> were relatively uniform while the Munidopsidae had large differences with concentrations in 0&#x2013;10 and &#x003E;50% (<xref ref-type="fig" rid="F6">Figure 6</xref>). Except for the density of 11&#x2013;20 individual/m<sup>2</sup> (ind./m<sup>2</sup>) for Munidopsidae, there were high error means in the range of 0&#x2013;50 ind./m<sup>2</sup> for these two species. The error means were all reduced in the range of 50&#x2013;100 ind./m<sup>2</sup>. The <italic>G. platifrons</italic> had the lowest error mean for 151&#x2013;200 ind./m<sup>2</sup> at 19.37 &#x00B1; 43.70%, while the Munidopsidae for 81&#x2013;90 ind./m<sup>2</sup> had an error of 27.73 &#x00B1; 24.65%. Both species had low errors at relatively high densities. This also means that our model could meet the needs of cold seep scientific research with dense epifauna. The complexity of cold seep environments and epifauna density were the main reason for changes in the recognition accuracy. The difficulty of identifying <italic>G. platifrons</italic> was that their shells were similar in color to their surroundings, which created high false positives for the background carbonate rocks. The irregular shape and lamination were the main difficulties for Munidopsidae recognition. The image processing (such as sharpening and contrast stretching) and algorithm still require further improvements.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>Error mean for different densities about the dominant species and the number of images with different errors.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-08-775433-g006.tif"/>
</fig>
<p>Several classifiers with different emphases improved the accuracy and interpretability of cold seep substrate classification. Two main substrates (hard and soft) and seven small classifications were defined in <xref ref-type="table" rid="T1">Table 1</xref>. A total of 480 images of biotas and 5,520 images of abiotic zones were tested, and the error mean of all substrates reached 25.13%. Biological mixing (2.44%), muddy bottom (15.95%), mussel beds (18.54%), and shell debris (28.17%) had relatively lower error means while the exposed authigenic carbonates (40.55%), lobster clusters (51.72%), and reduced sediments (76.30%) had higher error means (<xref ref-type="fig" rid="F7">Figure 7</xref>). The color of the reduced sediments (black and purple) and the exposed authigenic carbonates (gray) were easily confused with the dark surroundings. So, the model may be improved in conjunction with the application of image enhancement technologies.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption><p>Error means for different substrates.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-08-775433-g007.tif"/>
</fig>
<p>The recognition and statistical results provide the spatial distribution of substrates and epifaunas in the entire mosaic (<xref ref-type="fig" rid="F8">Figures 8</xref>, <xref ref-type="fig" rid="F9">9</xref>). Overall, the model identifications of substrates and epifaunas were nearly the same as manual processes. For epifauna, the identification results showed that the total number of <italic>G. platifrons</italic> and Munidopsidae were 1,75,661 and 24,157 ind. while there were actually 2,15,512 and 37,422 ind., respectively. The identifications in high-density areas were insufficient while some areas with no epifauna showed an excess of false positives. For the substrates, except for the relatively high differences in reduced sediments, the substrate identification was nearly the same as manual operations. The proposed model could be an effective method for the recognition and classification of substrates and epifauna regardless of the number of images.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption><p>Spatial distribution of <italic>G. platifrons</italic> and Munidopsidae. The results for <italic>G. platifrons</italic> with <bold>(A)</bold> manual counting and <bold>(B)</bold> model identification, and for Munidopsidae with <bold>(C)</bold> manual counting and <bold>(D)</bold> model identification. The large black and gray colored region are hard and soft substrate, respectively.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-08-775433-g008.tif"/>
</fig>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption><p>Spatial distribution of different substrates, with <bold>(A)</bold> manual counting and <bold>(B)</bold> model identification, respectively.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-08-775433-g009.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="conclusion" id="S4">
<title>Conclusion</title>
<p>This paper developed a model to automatically identify and count cold seeps substrates and the dominant associated species. The approach can significantly improve the accuracy of mapping habitats and species distributions, which ensures the sustainable exploitation and utilization of cold seeps. Considering the high heterogeneity of cold seep areas, this will help further cold seep research. The use of the Faster R-CNN + FPN and several integrated classifiers were proven as effective to solve this problem. The classification and recognition of substrates in cold seeps were first applied. To improve the accuracy, future work will focus on image enhancements and algorithm improvements.</p>
</sec>
<sec sec-type="data-availability" id="S5">
<title>Data Availability Statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.12157/IOCAS.20211029.001">doi: 10.12157/IOCAS.20211029.001</ext-link>.</p>
</sec>
<sec id="S6">
<title>Author Contributions</title>
<p>HW and CL: conceptualization. HW, XF, and ZL: data curation. HW and XF: formal analysis and software and writing&#x2014;original draft. CL: funding acquisition and writing&#x2014;review and editing. HW, XF, and CZ: methodology. HW: validation. All authors agreed to be accountable for the content of the work.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s7">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<sec sec-type="funding-information" id="s8">
<title>Funding</title>
<p>This work was supported by the National Natural Science Foundation of China (42030407 and 42076091), the Strategic Priority Research Program of the Chinese Academy of Sciences (XDA22050303, XDB42020401, and XDA22050302), the National Key R&#x0026;D Program of the Ministry of Science and Technology (2018YFC0310802), and the Youth Innovation Promotion Association of the Chinese Academy of Sciences. The samples and data were collected by the R.V. <italic>Kexue</italic>.</p>
</sec>
<ack>
<p>We thank Bin Zhang and Yuhai Liu for the helping of project implementation. We appreciate the Marine Science Data Center of the Chinese Academy of Sciences for providing data services.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Adelson</surname> <given-names>E. H.</given-names></name> <name><surname>Anderson</surname> <given-names>C. H.</given-names></name> <name><surname>Bergen</surname> <given-names>J. R.</given-names></name> <name><surname>Burt</surname> <given-names>P. J.</given-names></name> <name><surname>Ogden</surname> <given-names>J. M.</given-names></name></person-group> (<year>1983</year>). <article-title>Pyramid methods in image processing.</article-title> <source><italic>RCA Eng.</italic></source> <volume>29</volume> <fpage>33</fpage>&#x2013;<lpage>41</lpage>.</citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Albawi</surname> <given-names>S.</given-names></name> <name><surname>Mohammed</surname> <given-names>T. A.</given-names></name> <name><surname>Al-Zawi</surname> <given-names>S.</given-names></name></person-group> (<year>2017</year>). &#x201C;<article-title>Understanding of a convolutional neural network</article-title>,&#x201D; in <source><italic>Proceedings of the 2017 International Conference on Engineering and Technology (ICET)</italic></source>, <publisher-loc>Antalya</publisher-loc>, <fpage>1</fpage>&#x2013;<lpage>6</lpage>.</citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Brooks</surname> <given-names>J. M.</given-names></name> <name><surname>Kennicutt</surname> <given-names>M. C.</given-names></name> <name><surname>Fay</surname> <given-names>R. R.</given-names></name> <name><surname>McDonald</surname> <given-names>T. J.</given-names></name> <name><surname>Sassen</surname> <given-names>R.</given-names></name></person-group> (<year>1984</year>). <article-title>Thermogenic gas hydrates in the Gulf of Mexico.</article-title> <source><italic>Science</italic></source> <volume>225</volume> <fpage>409</fpage>&#x2013;<lpage>411</lpage>. <pub-id pub-id-type="doi">10.1126/science.225.4660.409</pub-id> <pub-id pub-id-type="pmid">17813260</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Chen</surname> <given-names>G.</given-names></name> <name><surname>Ge</surname> <given-names>L.</given-names></name> <name><surname>Huang</surname> <given-names>B.</given-names></name> <name><surname>Cao</surname> <given-names>C.</given-names></name></person-group> (<year>2021</year>). <article-title>Global oceanic eddy identification: a deep learning method from argo profiles and altimetry data.</article-title> <source><italic>Front. Mar. Sci.</italic></source> <volume>8</volume>:<fpage>646926</fpage>. <pub-id pub-id-type="doi">10.3389/fmars.2021.646926</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cho</surname> <given-names>K.</given-names></name> <name><surname>Van Merri&#x00EB;nboer</surname> <given-names>B.</given-names></name> <name><surname>Gulcehre</surname> <given-names>C.</given-names></name> <name><surname>Bahdanau</surname> <given-names>D.</given-names></name> <name><surname>Bougares</surname> <given-names>F.</given-names></name> <name><surname>Schwenk</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2014</year>). &#x201C;<article-title>Learning phrase representations using RNN encoder-decoder for statistical machine translation</article-title>,&#x201D; in <source><italic>Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)</italic></source>, <publisher-loc>Doha</publisher-loc>, <fpage>1724</fpage>&#x2013;<lpage>1734</lpage>.</citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cordes</surname> <given-names>E. E.</given-names></name> <name><surname>Bergquist</surname> <given-names>D. C.</given-names></name> <name><surname>Fisher</surname> <given-names>C. R.</given-names></name></person-group> (<year>2009</year>). <article-title>Macro-ecology of gulf of mexico cold seeps.</article-title> <source><italic>Annu. Rev. Mar. Sci.</italic></source> <volume>1</volume> <fpage>143</fpage>&#x2013;<lpage>168</lpage>. <pub-id pub-id-type="doi">10.1146/annurev.marine.010908.163912</pub-id> <pub-id pub-id-type="pmid">21141033</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Creswell</surname> <given-names>A.</given-names></name> <name><surname>White</surname> <given-names>T.</given-names></name> <name><surname>Dumoulin</surname> <given-names>V.</given-names></name> <name><surname>Arulkumaran</surname> <given-names>K.</given-names></name> <name><surname>Sengupta</surname> <given-names>B.</given-names></name> <name><surname>Bharath</surname> <given-names>A. A.</given-names></name></person-group> (<year>2018</year>). <article-title>Generative adversarial networks: an overview.</article-title> <source><italic>IEEE Signal Process. Mag.</italic></source> <volume>35</volume> <fpage>53</fpage>&#x2013;<lpage>65</lpage>. <pub-id pub-id-type="doi">10.3115/v1/D14-1179</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Elawady</surname> <given-names>M.</given-names></name></person-group> (<year>2015</year>). <source><italic>Sparse coral classification using deep convolutional neural.</italic></source> <comment>Dissertation/master&#x2019;s thesis</comment>, <publisher-name>Heriot-Watt University, Scotland (Edinburgh)</publisher-name>.</citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Goodfellow</surname> <given-names>I.</given-names></name> <name><surname>Bengio</surname> <given-names>Y.</given-names></name> <name><surname>Courville</surname> <given-names>A.</given-names></name></person-group> (<year>2016</year>). &#x201C;<article-title>Recursive Neural Networks</article-title>,&#x201D; in <source><italic>Deep Learning</italic></source>, <role>eds</role> <person-group person-group-type="editor"><name><surname>Gutierrez</surname> <given-names>D.</given-names></name> <name><surname>LeCun</surname> <given-names>Y.</given-names></name></person-group> (<publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>MIT press</publisher-name>), <fpage>400</fpage>&#x2013;<lpage>401</lpage>.</citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Han</surname> <given-names>F.</given-names></name> <name><surname>Yao</surname> <given-names>J.</given-names></name> <name><surname>Zhu</surname> <given-names>H.</given-names></name> <name><surname>Wang</surname> <given-names>C.</given-names></name></person-group> (<year>2020</year>). <article-title>Marine organism detection and classification from underwater vision based on the deep CNN method.</article-title> <source><italic>Math. Prob. Eng.</italic></source> <volume>2020</volume> <fpage>1</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1155/2020/3937580</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hsu</surname> <given-names>H.-H.</given-names></name> <name><surname>Liu</surname> <given-names>C.-S.</given-names></name> <name><surname>Morita</surname> <given-names>S.</given-names></name> <name><surname>Tu</surname> <given-names>S.-L.</given-names></name> <name><surname>Lin</surname> <given-names>S.</given-names></name> <name><surname>Machiyama</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Seismic imaging of the Formosa Ridge cold seep site offshore of southwestern Taiwan.</article-title> <source><italic>Mar. Geophys. Res.</italic></source> <volume>39</volume> <fpage>523</fpage>&#x2013;<lpage>535</lpage>. <pub-id pub-id-type="doi">10.1007/s11001-017-9339-y</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>H.</given-names></name> <name><surname>Zhou</surname> <given-names>H.</given-names></name> <name><surname>Yang</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Qi</surname> <given-names>L.</given-names></name> <name><surname>Zang</surname> <given-names>A.-Y.</given-names></name></person-group> (<year>2019</year>). <article-title>Faster R-CNN for marine organisms detection and recognition using data augmentation.</article-title> <source><italic>Neurocomputing</italic></source> <volume>337</volume> <fpage>372</fpage>&#x2013;<lpage>384</lpage>. <pub-id pub-id-type="doi">10.1016/j.neucom.2019.01.084</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Joye</surname> <given-names>S. B.</given-names></name></person-group> (<year>2020</year>). <article-title>The geology and biogeochemistry of hydrocarbon seeps.</article-title> <source><italic>Annu. Rev. Earth Planet. Sci.</italic></source> <volume>48</volume> <fpage>205</fpage>&#x2013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-earth-063016-020052</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kennicutt</surname> <given-names>M. C.</given-names></name> <name><surname>Brooks</surname> <given-names>J. M.</given-names></name> <name><surname>Bidigare</surname> <given-names>R. R.</given-names></name> <name><surname>Denoux</surname> <given-names>G. J.</given-names></name></person-group> (<year>1988</year>). <article-title>Gulf of Mexico hydrocarbon seep communities&#x2014;I. Regional distribution of hydrocarbon seepage and associated fauna.</article-title> <source><italic>Deep Sea Res. Part I Oceanogr. Res. Papers</italic></source> <volume>35</volume> <fpage>1639</fpage>&#x2013;<lpage>1651</lpage>. <pub-id pub-id-type="doi">10.1016/0198-0149(88)90107-0</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Levin</surname> <given-names>L. A.</given-names></name></person-group> (<year>2005</year>). &#x201C;<article-title>Ecology of cold seep sediments: interactions of fauna with flow, chemistry and microbes</article-title>,&#x201D; in <source><italic>Oceanography and Marine Biology - An Annual Review</italic></source>, <volume>Vol. 43</volume> <role>eds</role> <person-group person-group-type="editor"><name><surname>Gibson</surname> <given-names>R. N.</given-names></name> <name><surname>Atkinson</surname> <given-names>R. J. A.</given-names></name> <name><surname>Gordon</surname> <given-names>J. D. M.</given-names></name></person-group> (<publisher-loc>Boca Raton, FL</publisher-loc>: <publisher-name>CRC Press</publisher-name>), <fpage>1</fpage>&#x2013;<lpage>46</lpage>. <pub-id pub-id-type="doi">10.1201/9781420037449.ch1</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Levin</surname> <given-names>L. A.</given-names></name> <name><surname>James</surname> <given-names>D. W.</given-names></name> <name><surname>Martin</surname> <given-names>C. M.</given-names></name> <name><surname>Rathburn</surname> <given-names>A. E.</given-names></name> <name><surname>Harris</surname> <given-names>L. H.</given-names></name> <name><surname>Michener</surname> <given-names>R. H.</given-names></name></person-group> (<year>2000</year>). <article-title>Do methane seeps support distinct epifaunal assemblages? Observations on community structure and nutrition from the northern California slope and shelf.</article-title> <source><italic>Mar. Ecol. Prog. Ser.</italic></source> <volume>208</volume> <fpage>21</fpage>&#x2013;<lpage>39</lpage>. <pub-id pub-id-type="doi">10.3354/meps208021</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>T.-Y.</given-names></name> <name><surname>Doll&#x00E1;r</surname> <given-names>P.</given-names></name> <name><surname>Girshick</surname> <given-names>R.</given-names></name> <name><surname>He</surname> <given-names>K.</given-names></name> <name><surname>Hariharan</surname> <given-names>B.</given-names></name> <name><surname>Belongie</surname> <given-names>S.</given-names></name></person-group> (<year>2017</year>). &#x201C;<article-title>Feature pyramid networks for object detection</article-title>,&#x201D; in <source><italic>Proceedings of the IEEE conference on computer vision and pattern recognition</italic></source>, <publisher-loc>San Juan, PR</publisher-loc>, <fpage>2117</fpage>&#x2013;<lpage>2125</lpage>.</citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lu</surname> <given-names>H.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Uemura</surname> <given-names>T.</given-names></name> <name><surname>Ge</surname> <given-names>Z.</given-names></name> <name><surname>Xu</surname> <given-names>X.</given-names></name> <name><surname>He</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>FDCNet: filtering deep convolutional network for marine organism classification.</article-title> <source><italic>Multimed. Tools Appl.</italic></source> <volume>77</volume> <fpage>21847</fpage>&#x2013;<lpage>21860</lpage>. <pub-id pub-id-type="doi">10.1007/s11042-017-4585-1</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>MacDonald</surname> <given-names>I. R.</given-names></name> <name><surname>Sager</surname> <given-names>W. W.</given-names></name> <name><surname>Peccini</surname> <given-names>M. B.</given-names></name></person-group> (<year>2003</year>). <article-title>Gas hydrate and chemosynthetic biota in mounded bathymetry at mid-slope hydrocarbon seeps: Northern Gulf of Mexico.</article-title> <source><italic>Mar. Geol.</italic></source> <volume>198</volume> <fpage>133</fpage>&#x2013;<lpage>158</lpage>. <pub-id pub-id-type="doi">10.1016/s0025-3227(03)00098-7</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Menot</surname> <given-names>L.</given-names></name> <name><surname>Galeron</surname> <given-names>J.</given-names></name> <name><surname>Olu</surname> <given-names>K.</given-names></name> <name><surname>Caprais</surname> <given-names>J.-C.</given-names></name> <name><surname>Crassous</surname> <given-names>P.</given-names></name> <name><surname>Khripounoff</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Spatial heterogeneity of macrofaunal communities in and near a giant pockmark area in the deep Gulf of Guinea.</article-title> <source><italic>Mar. Ecol. Evol. Perspect.</italic></source> <volume>31</volume> <fpage>78</fpage>&#x2013;<lpage>93</lpage>. <pub-id pub-id-type="doi">10.1111/j.1439-0485.2009.00340.x</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Paull</surname> <given-names>C. K.</given-names></name> <name><surname>Hecker</surname> <given-names>B.</given-names></name> <name><surname>Commeau</surname> <given-names>R.</given-names></name> <name><surname>Freeman-Lynde</surname> <given-names>R. P.</given-names></name> <name><surname>Neumann</surname> <given-names>C.</given-names></name> <name><surname>Corso</surname> <given-names>W. P.</given-names></name><etal/></person-group> (<year>1984</year>). <article-title>Biological communities at the Florida Escarpment resemble hydrothermal vent taxa.</article-title> <source><italic>Science</italic></source> <volume>226</volume> <fpage>965</fpage>&#x2013;<lpage>967</lpage>. <pub-id pub-id-type="doi">10.1126/science.226.4677.965</pub-id> <pub-id pub-id-type="pmid">17737352</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Raphael</surname> <given-names>A.</given-names></name> <name><surname>Dubinsky</surname> <given-names>Z.</given-names></name> <name><surname>Iluz</surname> <given-names>D.</given-names></name> <name><surname>Netanyahu</surname> <given-names>N. S.</given-names></name></person-group> (<year>2020</year>). <article-title>Neural network recognition of marine benthos and corals.</article-title> <source><italic>Diversity</italic></source> <volume>12</volume>:<fpage>29</fpage>. <pub-id pub-id-type="doi">10.3390/d12010029</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ren</surname> <given-names>S.</given-names></name> <name><surname>He</surname> <given-names>K.</given-names></name> <name><surname>Girshick</surname> <given-names>R.</given-names></name> <name><surname>Sun</surname> <given-names>J.</given-names></name></person-group> (<year>2015</year>). <article-title>Faster R-CNN: towards real-time object detection with region proposal networks.</article-title> <source><italic>IEEE Trans. Pattern Anal. Machine Intell.</italic></source> <volume>28</volume> <fpage>91</fpage>&#x2013;<lpage>99</lpage>. <pub-id pub-id-type="doi">10.1109/TPAMI.2016.2577031</pub-id> <pub-id pub-id-type="pmid">27295650</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sen</surname> <given-names>A.</given-names></name> <name><surname>Chitkara</surname> <given-names>C.</given-names></name> <name><surname>Hong</surname> <given-names>W. L.</given-names></name> <name><surname>Lepland</surname> <given-names>A.</given-names></name> <name><surname>Cochrane</surname> <given-names>S.</given-names></name> <name><surname>di Primio</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Image based quantitative comparisons indicate heightened megabenthos diversity and abundance at a site of weak hydrocarbon seepage in the southwestern Barents Sea.</article-title> <source><italic>PeerJ</italic></source> <volume>7</volume>:<fpage>e7398</fpage>. <pub-id pub-id-type="doi">10.7717/peerj.7398</pub-id> <pub-id pub-id-type="pmid">31410307</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sen</surname> <given-names>A.</given-names></name> <name><surname>Ondr&#x00E9;as</surname> <given-names>H.</given-names></name> <name><surname>Gaillot</surname> <given-names>A.</given-names></name> <name><surname>Marcon</surname> <given-names>Y.</given-names></name> <name><surname>Augustin</surname> <given-names>J.-M.</given-names></name> <name><surname>Olu</surname> <given-names>K.</given-names></name></person-group> (<year>2016</year>). <article-title>The use of multibeam backscatter and bathymetry as a means of identifying faunal assemblages in a deep-sea cold seep.</article-title> <source><italic>Deep Sea Res. Part I Oceanogr. Res. Papers</italic></source> <volume>110</volume> <fpage>33</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1016/j.dsr.2016.01.005</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sibuet</surname> <given-names>M.</given-names></name> <name><surname>Olu</surname> <given-names>K.</given-names></name></person-group> (<year>1998</year>). <article-title>Biogeography, biodiversity and fluid dependence of deep-sea cold-seep communities at active and passive margins.</article-title> <source><italic>Deep Sea Res. Part II Top. Stud. Oceanogr.</italic></source> <volume>45</volume>:<fpage>517</fpage>. <pub-id pub-id-type="doi">10.1016/s0967-0645(97)00074-x</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Simonyan</surname> <given-names>K.</given-names></name> <name><surname>Zisserman</surname> <given-names>A.</given-names></name></person-group> (<year>2014</year>). <article-title>Very deep convolutional networks for large-scale image recognition.</article-title> <source>arXiv</source> <comment>[Preprint].</comment> <volume>arXiv</volume>:<fpage>1409.1556</fpage></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Szegedy</surname> <given-names>C.</given-names></name> <name><surname>Ioffe</surname> <given-names>S.</given-names></name> <name><surname>Vanhoucke</surname> <given-names>V.</given-names></name> <name><surname>Alemi</surname> <given-names>A. A.</given-names></name></person-group> (<year>2017</year>). &#x201C;<article-title>Inception-v4, inception-resnet and the impact of residual connections on learning</article-title>,&#x201D; in <source><italic>Proceedings of the Thirty-First AAAI Conference on Artificial Intelligence</italic></source>, <publisher-loc>Mountain View, CA</publisher-loc>, <fpage>4278</fpage>&#x2013;<lpage>4284</lpage>.</citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y. Y.</given-names></name> <name><surname>Wang</surname> <given-names>C.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name></person-group> (<year>2017</year>). &#x201C;<article-title>Combining single shot multibox detector with transfer learning for ship detection using sentinel-1 images</article-title>,&#x201D; in <source><italic>Proceedings of 2017 Sar in Big Data Era: Models, Methods and Applications</italic></source>, <publisher-loc>Beijing</publisher-loc>.</citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zuazo</surname> <given-names>A.</given-names></name> <name><surname>Grinyo</surname> <given-names>J.</given-names></name> <name><surname>Lopez-Vazquez</surname> <given-names>V.</given-names></name> <name><surname>Rodriguez</surname> <given-names>E.</given-names></name> <name><surname>Costa</surname> <given-names>C.</given-names></name> <name><surname>Ortenzi</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>An automated pipeline for image processing and data treatment to track activity rhythms of <italic>Paragorgia arborea</italic> in relation to hydrographic conditions.</article-title> <source><italic>Sensors</italic></source> <volume>20</volume>:<fpage>6281</fpage>. <pub-id pub-id-type="doi">10.3390/s20216281</pub-id> <pub-id pub-id-type="pmid">33158174</pub-id></citation></ref>
</ref-list>
</back>
</article>