<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Adv. Opt. Technol.</journal-id>
<journal-title>Advanced Optical Technologies</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Adv. Opt. Technol.</abbrev-journal-title>
<issn pub-type="epub">2192-8584</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1474654</article-id>
<article-id pub-id-type="doi">10.3389/aot.2024.1474654</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Advanced Optical Technologies</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>W1-Net: a highly scalable ptychography convolutional neural network</article-title>
<alt-title alt-title-type="left-running-head">Xing et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/aot.2024.1474654">10.3389/aot.2024.1474654</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Xing</surname>
<given-names>Chengye</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2726630/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Lei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2761712/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mu</surname>
<given-names>Yangyang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2727465/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Yu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Chang</surname>
<given-names>Guangcai</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Institute of High Energy Physics</institution>, <institution>Chinese Academy of Sciences</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>University of Chinese Academy of Sciences</institution>, <institution>Chinese Academy of Sciences</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Spallation Neutron Source Science Center</institution>, <institution>China Spallation Neutron Source</institution>, <addr-line>Dongguan</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2642870/overview">Yudong Yao</ext-link>, ShanghaiTech University, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1640313/overview">Lu Rong</ext-link>, Beijing University of Technology, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1697780/overview">Fucai Zhang</ext-link>, Southern University of Science and Technology, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Guangcai Chang, <email>changgc@ihep.ac.cn</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>23</day>
<month>10</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>13</volume>
<elocation-id>1474654</elocation-id>
<history>
<date date-type="received">
<day>02</day>
<month>08</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>11</day>
<month>10</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Xing, Wang, Mu, Li and Chang.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Xing, Wang, Mu, Li and Chang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>X-ray ptychography is a coherent diffraction imaging technique that allows for the quantitative retrieval of both the amplitude and phase information of a sample in diffraction-limited resolution. However, traditional reconstruction algorithms require a large number of iterations to obtain phase and amplitude images exactly, and the expensive computation precludes real-time imaging. To solve the inverse problem of ptychography data, PtychoNN uses deep convolutional neural networks for real-time imaging. However, its model is relatively simple, and its accuracy is limited by the size of the training dataset, resulting in lower robustness. To address this problem, a series of W-Net neural network models have been proposed which can robustly reconstruct the object phase information from the raw data. Numerical experiments demonstrate that our neural network exhibits better robustness, superior reconstruction capabilities and shorter training time with high-precision ptychography imaging.</p>
</abstract>
<kwd-group>
<kwd>X-ray ptychography</kwd>
<kwd>deep learning</kwd>
<kwd>phase retrieval</kwd>
<kwd>real-time imaging</kwd>
<kwd>W1-net</kwd>
</kwd-group>
<contract-num rid="cn001">No.E32957S3</contract-num>
<contract-num rid="cn002">No.E3545JU2 No.E35451U2</contract-num>
<contract-sponsor id="cn001">Chinese Academy of Sciences<named-content content-type="fundref-id">10.13039/501100002367</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">Institute of High Energy Physics, Chinese Academy of Sciences<named-content content-type="fundref-id">10.13039/501100011181</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Ptychography is a technique for coherent diffraction imaging that provides quantitative phase information of a sample in diffraction-limited resolution (<xref ref-type="bibr" rid="B15">Pfeiffer, 2018</xref>). It can image a large number of thick samples in high resolution without complex sample preparation while providing the best observation ability and application potential for materials and biological samples. However, the long time for data acquisition and the expensive computing resources cost for intensive data processing remain significant obstacles. In addition, ptychography is widely used in combination with other optical techniques in various fields such as biomedical (<xref ref-type="bibr" rid="B16">Shemilt et al., 2015</xref>; <xref ref-type="bibr" rid="B2">Bhartiya et al., 2021</xref>), chemical (<xref ref-type="bibr" rid="B1">Beckers et al., 2011</xref>) and metrology (<xref ref-type="bibr" rid="B5">D&#x2019;alfonso et al., 2014</xref>). In conventional experiments, a small aperture or other optical device is used to focus the light probe for scanning the sample. The diffraction pattern at each scanning position is captured by a detector. Adjacent scanning positions require partial overlap to ensure that the recorded experimental data contains sufficient information. However, the detector only acquires intensity while phase information is lost. Therefore, phase retrieval algorithms are needed to recover the phase of the recorded diffraction pattern and reconstruct the sample structure. Traditional phase retrieval algorithms are iterative, such as ePIE (Extended Ptychographic Iterative Engine) (<xref ref-type="bibr" rid="B12">Maiden and Rodenburg, 2009</xref>) and DM (Difference Map) (<xref ref-type="bibr" rid="B18">Thibault et al., 2008</xref>; <xref ref-type="bibr" rid="B17">2009</xref>), which require more supporting conditions and computation time to converge and obtain the real phase information. 
The inherent principle of these algorithms requires that the overlap between adjacent scanning areas in ptychography experiments should be greater than 50% to obtain better reconstruction results, which increases scanning time and experimental data volume and places higher demands on the radiation resistance of the sample. The increased amount of data also increases the computational time of traditional iterative algorithms, which places higher demands on the computing hardware. To decrease the computational time, in 2017, Maiden et al. proposed mPIE (<xref ref-type="bibr" rid="B11">Maiden et al., 2017</xref>) based on the idea of momentum gradient descent algorithm in machine learning. After a certain number of iterations, the distribution function update formula of the object under test was added with a momentum term, which significantly reduced the number of iterations and accelerated the convergence speed of the algorithm. Kappeler et al. first proposed building PtychNet (<xref ref-type="bibr" rid="B10">Kappeler et al., 2017</xref>) and other models (<xref ref-type="bibr" rid="B14">Nguyen et al., 2018</xref>; <xref ref-type="bibr" rid="B20">Yan et al., 2020</xref>) based on Convolutional Neural Networks (CNN) for the reconstruction of images in Fourier ptychography (FP). In 2019, <xref ref-type="bibr" rid="B9">I&#x15f;&#x131;l et al. (2019)</xref> constructed a new phase recovery network by combining Deep Neural Networks (DNN) and the Hybrid Input-Output (HIO) (<xref ref-type="bibr" rid="B6">Fienup, 1978</xref>) algorithm. They embedded the DNN network into the iteration process of HIO. In 2020, Cherukara et al. constructed the network PtychoNN (<xref ref-type="bibr" rid="B3">Cherukara et al., 2020</xref>), a deep convolutional neural network that learns the direct mapping from far-field coherent diffraction data to real-space image structure and phase. 
PtychoNN is hundreds of times faster than Ptycholib (<xref ref-type="bibr" rid="B13">Nashed et al., 2014</xref>) because it understands the direct relationship between diffraction data and image structure and phase. Therefore, data inversion no longer requires overlap constraints, which increases the speed of data acquisition and reconstruction by 5 times (<xref ref-type="bibr" rid="B3">Cherukara et al., 2020</xref>).</p>
</sec>
<sec sec-type="methods" id="s2">
<title>2 Methods</title>
<sec id="s2-1">
<title>2.1 Neural networks</title>
<p>The network architecture of PtychoNN is designed to allow a single network to predict both amplitude and phase, thus minimizing the number of network weights that need to be learned. This network only uses convolutional and up/downsampling layers (without dense layers) to keep the number of network weights minimum, improving the speed of training and prediction (<xref ref-type="bibr" rid="B3">Cherukara et al., 2020</xref>). However, the relationship between the number of network weights and the speed of network training is not simply linear. Therefore, we took inspiration from ConvNext V2 (<xref ref-type="bibr" rid="B19">Woo et al., 2023</xref>), Squeeze-and-Excitation Networks (<xref ref-type="bibr" rid="B8">Hu et al., 2018</xref>) and developed the W1-Net model.</p>
<p>
<xref ref-type="fig" rid="F1">Figure 1</xref> shows the architecture of W1-Net. The W1-Net architecture consists of an encoder and two decoders, enabling a single network to predict both amplitude and phase. In comparison to PtychoNN, W1-Net primarily focuses on increasing the depth of the encoder network and introducing residual networks and channel attention mechanisms. The enhancement of feature extraction capability and expressive power is achieved through increasing the network depth. With the increase in network depth, the network can learn more complex features. Shallow networks may only capture low-level features such as edges and textures in images, while deep networks can learn more abstract high-level features, such as parts and overall structures of objects. Deep networks capture the inherent structure and patterns in the data through hierarchical abstraction, thereby enabling more accurate predictions. The introduction of residual networks aims to address issues such as gradient vanishing or exploding that may arise with increasing model depth, thereby avoiding degradation problems as the number of layers increases. By embedding learning mechanisms, the model captures spatial correlations and improves network performance. The channel attention mechanism (SE block) adaptively recalibrates channel-wise feature responses by explicitly modeling interdependencies between channels. The encoder&#x2019;s core consists of a convolutional layer, three downsample layers, four ConvNext blocks (stacked in a 2:2:4:2 manner), and three SE blocks. The convolutional layer and downsample layers aim to decrease image size, thereby reducing computation time and workload. The decoder comprises upsample and convolutional layers, with bilinear interpolation used in the upsample layer to reduce computation time and workload. Additionally, double convolution and batch normalization are employed to prevent overfitting. 
To achieve a wider field of view, a larger kernel size is utilized in the ConvNext block and the first convolutional layer of the encoder. Furthermore, SE blocks optimize the weights between channels, and a new activation function is utilized to improve training results.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Architecture of W1-Net, a deep convolutional neural network.</p>
</caption>
<graphic xlink:href="aot-13-1474654-g001.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="results|discussion" id="s3">
<title>3 Experimental results and discussions</title>
<sec id="s3-1">
<title>3.1 Training configuration</title>
<p>To train and evaluate the W1-Net network, we utilized the dataset provided by (<xref ref-type="bibr" rid="B3">Cherukara et al., 2020</xref>), which consisted of 16,100 triplets of raw coherent diffraction data, real-space amplitude, and phase images obtained from the first 100 scans of an experimental natural material structure conducted on the X-ray nano-probe beamline at the Advanced Photon Source 26ID. The scanning step was 30&#xa0;nm over 161 <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 161 points, with a 50% spatial overlap, and the training dataset was split 90&#x2013;10 into training and validation. The weights of W1-Net were updated using adaptive moment estimation (ADAM) to minimize the mean absolute error (MAE) per pixel, with an initial learning rate of 0.001.</p>
<p>The W1-Net network was trained on PyTorch, using an Intel Core i7-6700 CPU and an NVIDIA GeForce RTX 3060 GPU. To evaluate the performance of the model, we compared the experimental results of PtychoNN and W1-Net, using peak signal-to-noise ratio (PSNR) (<xref ref-type="bibr" rid="B7">Hor&#xe9; and Ziou, 2010</xref>), mean squared error (MSE) (<xref ref-type="bibr" rid="B7">Hor&#xe9; and Ziou, 2010</xref>), and structural similarity index (SSIM) as quantitative indicators for a comprehensive analysis of the models.</p>
</sec>
<sec id="s3-2">
<title>3.2 Experiment results</title>
<sec id="s3-2-1">
<title>3.2.1 Single-shot experiment results</title>
<p>
<xref ref-type="fig" rid="F2">Figure 2</xref> shows single-shot examples of the performance of PtychoNN and W1-Net on data from the test region of the experimental scan. We can observe that by using our W1-Net network, we are able to reconstruct the fine details of objects more completely, especially in terms of reconstructing edge information. In contrast, the reconstruction results of PtychoNN lose a lot of edge information. Furthermore, from our data (<xref ref-type="table" rid="T1">Tables 1</xref>, <xref ref-type="table" rid="T2">2</xref>), it is clear that W1-Net exhibits higher peak signal-to-noise ratio (PSNR), structural similarity index (SSIM), and lower mean squared error (MSE) for these representative scanning points.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Single-shot predictions. <bold>(A)</bold> Input diffraction at different scan points, <bold>(B)</bold> predicted by PtychoNN, <bold>(C)</bold> predicted by W1-Net, <bold>(D)</bold> Ground-truth. Visually, our W1-Net achieves better results compared to PtychoNN.</p>
</caption>
<graphic xlink:href="aot-13-1474654-g002.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Amplitude of single-shot predictions.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Scan point</th>
<th align="left">Models</th>
<th align="left">MSE</th>
<th align="left">PSNR (dB)</th>
<th align="left">SSIM</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center" rowspan="2">P1</td>
<td align="center">PtychoNN</td>
<td align="center">
<inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:mn>1.014</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">39.940</td>
<td align="center">0.9803</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">
<inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:mn>8.620</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">40.645</td>
<td align="center">0.9830</td>
</tr>
<tr>
<td align="center" rowspan="2">P2</td>
<td align="center">PtychoNN</td>
<td align="center">
<inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:mn>9.769</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">40.102</td>
<td align="center">0.9792</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">
<inline-formula id="inf5">
<mml:math id="m5">
<mml:mrow>
<mml:mn>1.234</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">39.088</td>
<td align="center">0.9749</td>
</tr>
<tr>
<td align="center" rowspan="2">P3</td>
<td align="center">PtychoNN</td>
<td align="center">
<inline-formula id="inf6">
<mml:math id="m6">
<mml:mrow>
<mml:mn>1.045</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">39.808</td>
<td align="center">0.9831</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">
<inline-formula id="inf7">
<mml:math id="m7">
<mml:mrow>
<mml:mn>6.707</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">41.735</td>
<td align="center">0.9866</td>
</tr>
<tr>
<td align="center" rowspan="2">P4</td>
<td align="center">PtychoNN</td>
<td align="center">7.311<inline-formula id="inf8">
<mml:math id="m8">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>10<sup>&#x2212;5</sup>
</td>
<td align="center">41.360</td>
<td align="center">0.9839</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">8.914<inline-formula id="inf9">
<mml:math id="m9">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>10<sup>&#x2212;5</sup>
</td>
<td align="center">40.499</td>
<td align="center">0.9806</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Phase of single-shot predictions.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Scan point</th>
<th align="center">Models</th>
<th align="center">MSE</th>
<th align="center">PSNR (dB)</th>
<th align="center">SSIM</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center" rowspan="2">P1</td>
<td align="center">PtychoNN</td>
<td align="center">0.4118</td>
<td align="center">51.984</td>
<td align="center">0.9719</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">0.2427</td>
<td align="center">54.280</td>
<td align="center">0.9843</td>
</tr>
<tr>
<td align="center" rowspan="2">P2</td>
<td align="center">PtychoNN</td>
<td align="center">0.5274</td>
<td align="center">50.910</td>
<td align="center">0.9573</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">0.3076</td>
<td align="center">53.251</td>
<td align="center">0.9748</td>
</tr>
<tr>
<td align="center" rowspan="2">P3</td>
<td align="center">PtychoNN</td>
<td align="center">0.5580</td>
<td align="center">50.664</td>
<td align="center">0.9526</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">0.2730</td>
<td align="center">53.770</td>
<td align="center">0.9819</td>
</tr>
<tr>
<td align="center" rowspan="2">P4</td>
<td align="center">PtychoNN</td>
<td align="center">0.3093</td>
<td align="center">53.228</td>
<td align="center">0.9777</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">0.2480</td>
<td align="center">54.186</td>
<td align="center">0.9787</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>These metrics are important standards for measuring the quality of image reconstruction. A higher PSNR value indicates less noise difference between the reconstructed image and the original image, a higher SSIM value indicates higher structural similarity between the reconstructed image and the original image, and a lower MSE value means a smaller overall error between the reconstructed image and the original image.</p>
<p>Because the detector only obtains the intensity and loses the phase information in the experiment, we pay more attention to phase retrieval. Therefore, based on these results, we can conclude that our W1-Net network performs better in reconstructing object details and edge information, and achieves better performance than PtychoNN across multiple metrics of phase reconstruction.</p>
</sec>
<sec id="s3-2-2">
<title>3.2.2 Effect of training data size on performance</title>
<p>The training of neural networks requires a large amount of training data and computational resources. The quantity and size of training samples directly affect the training time and model accuracy. Therefore, we conducted a performance evaluation of W1-Net and PtychoNN using the same training data.</p>
<p>The results (<xref ref-type="fig" rid="F3">Figures 3</xref>, <xref ref-type="fig" rid="F4">4</xref>) showed that W1-Net outperforms PtychoNN in terms of reconstruction quality with the same training data. Particularly, W1-Net performs well even with fewer training samples, indicating its better robustness. This allows us to train W1-Net with less training data, reducing the demand for computational resources.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Effect of training data size in amplitude recovery. Images from the left to right show the performance of different models when trained on progressively fewer training samples.</p>
</caption>
<graphic xlink:href="aot-13-1474654-g003.tif"/>
</fig>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Effect of training data size in phase recovery. Images from the left to right show the performance of different models when trained on progressively fewer training samples.</p>
</caption>
<graphic xlink:href="aot-13-1474654-g004.tif"/>
</fig>
</sec>
<sec id="s3-2-3">
<title>3.2.3 Effect of training epochs on performance</title>
<p>Furthermore, a robust network should exhibit relatively positive test results and faster convergence speed across different training epochs.</p>
<p>The results in <xref ref-type="table" rid="T3">Table 3</xref> showed that W1-Net has lower mean squared error (MSE) and higher structural similarity index (SSIM) within the same training epochs. This means that W1-Net can converge faster during the training process and achieve relatively positive test results at each training epoch.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Results of different training epochs.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Epoch</th>
<th align="center">Models</th>
<th align="center">MSE (Amplitude)</th>
<th align="center">MSE (Phase)</th>
<th align="center">SSIM (Amplitude)</th>
<th align="center">SSIM (Phase)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center" rowspan="2">10</td>
<td align="center">PtychoNN</td>
<td align="center">
<inline-formula id="inf10">
<mml:math id="m10">
<mml:mrow>
<mml:mn>5.12</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">0.0910</td>
<td align="center">0.9872</td>
<td align="center">0.9930</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">
<inline-formula id="inf11">
<mml:math id="m11">
<mml:mrow>
<mml:mn>4.78</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">0.0728</td>
<td align="center">0.9879</td>
<td align="center">0.9946</td>
</tr>
<tr>
<td align="center" rowspan="2">20</td>
<td align="center">PtychoNN</td>
<td align="center">
<inline-formula id="inf12">
<mml:math id="m12">
<mml:mrow>
<mml:mn>4.00</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">0.0894</td>
<td align="center">0.9897</td>
<td align="center">0.9929</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">
<inline-formula id="inf13">
<mml:math id="m13">
<mml:mrow>
<mml:mn>3.97</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">0.0753</td>
<td align="center">0.9897</td>
<td align="center">0.9952</td>
</tr>
<tr>
<td align="center" rowspan="2">40</td>
<td align="center">PtychoNN</td>
<td align="center">
<inline-formula id="inf14">
<mml:math id="m14">
<mml:mrow>
<mml:mn>4.07</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">0.0928</td>
<td align="center">0.9894</td>
<td align="center">0.9924</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">
<inline-formula id="inf15">
<mml:math id="m15">
<mml:mrow>
<mml:mn>3.96</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">0.0770</td>
<td align="center">0.9896</td>
<td align="center">0.9946</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In conclusion, our W1-Net network demonstrates better reconstruction performance, better robustness, and faster convergence speed with the same training data. This makes it a promising choice for achieving high-quality image reconstruction in resource-constrained scenarios.</p>
</sec>
<sec id="s3-2-4">
<title>3.2.4 Scalability of the model</title>
<p>Our results demonstrated that W1-Net outperformed PtychoNN in terms of accuracy, despite having a larger number of parameters and model size. In addition, we tested the W2-Net (<xref ref-type="fig" rid="F5">Figure 5</xref>) and W3-Net (<xref ref-type="fig" rid="F6">Figure 6</xref>) models based on W1-Net by changing the number of filters, the number of stacked blocks and other minor adjustments.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Architecture of W2-Net, a deep convolutional neural network based on W1-Net.</p>
</caption>
<graphic xlink:href="aot-13-1474654-g005.tif"/>
</fig>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Architecture of W3-Net, a lightweight and efficient network based on W1-Net.</p>
</caption>
<graphic xlink:href="aot-13-1474654-g006.tif"/>
</fig>
<p>By replacing convolution with depthwise convolution (<xref ref-type="bibr" rid="B4">Chollet, 2017</xref>) and reducing the number of convolutional layers, filters and ReLU activations, W3-Net achieved the same reconstruction precision with only 8.26 percent of the parameters of PtychoNN. It also greatly reduced the inference time, from 21.437&#xa0;ms for PtychoNN to 15.823&#xa0;ms for W3-Net, and alleviated the hardware requirements of real-time ptychographic imaging.</p>
<p>After training on the same data set for 60 epochs, the results in <xref ref-type="fig" rid="F7">Figure 7</xref> and <xref ref-type="table" rid="T4">Tables 4</xref>, <xref ref-type="table" rid="T5">5</xref> showed that the W-series networks achieved better reconstruction performance. Additionally, W1-Net produced fewer noticeable artifacts or blurs, resulting in faster and more precise data reconstruction. W2-Net showed superior performance in phase recovery. W3-Net trained faster and provides a lightweight and efficient network model.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Results of the different models. <bold>(A)</bold>: Ground-truth; <bold>(B)</bold>: PtychoNN; <bold>(C)</bold>: W3-Net; <bold>(D)</bold>: W1-Net; <bold>(E)</bold>: W2-Net. Visually, the reconstruction results improve progressively from left to right.</p>
</caption>
<graphic xlink:href="aot-13-1474654-g007.tif"/>
</fig>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Performance comparison of the three models on the same dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Models</th>
<th align="center">PSNR (Amplitude)(dB)</th>
<th align="center">PSNR (Phase)(dB)</th>
<th align="center">SSIM(Amplitude)</th>
<th align="center">SSIM(Phase)</th>
<th align="center">EVA (Phase)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">W1-Net</td>
<td align="center">44.027</td>
<td align="center">59.211</td>
<td align="center">0.9897</td>
<td align="center">0.9941</td>
<td align="center">0.855</td>
</tr>
<tr>
<td align="center">W3-Net</td>
<td align="center">43.981</td>
<td align="center">58.959</td>
<td align="center">0.9897</td>
<td align="center">0.9939</td>
<td align="center">0.869</td>
</tr>
<tr>
<td align="center">PtychoNN</td>
<td align="center">43.721</td>
<td align="center">58.559</td>
<td align="center">0.9890</td>
<td align="center">0.9930</td>
<td align="center">0.832</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Reconstructed results of different models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Models</th>
<th align="center">Param/Thousand</th>
<th align="center">FLOPs (G)</th>
<th align="center">MSE (Amplitude)</th>
<th align="center">MSE (Phase)</th>
<th align="center">Inference time (ms)</th>
<th align="center">Training time (s)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">W2-Net</td>
<td align="center">6656</td>
<td align="center">435.99</td>
<td align="center">
<inline-formula id="inf16">
<mml:math id="m16">
<mml:mrow>
<mml:mn>3.89</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">0.0590</td>
<td align="center">96.704</td>
<td align="center">5014</td>
</tr>
<tr>
<td align="center">W1-Net</td>
<td align="center">1780</td>
<td align="center">60.77</td>
<td align="center">
<inline-formula id="inf17">
<mml:math id="m17">
<mml:mrow>
<mml:mn>3.96</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">0.0780</td>
<td align="center">29.906</td>
<td align="center">1299</td>
</tr>
<tr>
<td align="center">W3-Net</td>
<td align="center">103</td>
<td align="center">10.77</td>
<td align="center">
<inline-formula id="inf18">
<mml:math id="m18">
<mml:mrow>
<mml:mn>4.00</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">0.0826</td>
<td align="center">15.823</td>
<td align="center">897</td>
</tr>
<tr>
<td align="center">PtychoNN</td>
<td align="center">1247</td>
<td align="center">154.86</td>
<td align="center">
<inline-formula id="inf19">
<mml:math id="m19">
<mml:mrow>
<mml:mn>4.25</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">0.0906</td>
<td align="center">21.437</td>
<td align="center">1326</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
</sec>
<sec sec-type="conclusion" id="s4">
<title>4 Conclusion</title>
<p>In this paper, we introduce a series of novel W-Net models, including a lightweight network, W3-Net, that effectively address the phase and amplitude reconstruction problems in ptychography. Compared to PtychoNN, our W1-Net model not only requires less training time but also exhibits superior reconstruction results. Specifically, our model achieves lower mean squared error (MSE) and higher structural similarity index (SSIM) in phase reconstruction. This indicates that our W1-Net model can accurately recover the phase information of the images.</p>
<p>Furthermore, our W1-Net model demonstrates higher scalability. We demonstrate in our study that the W2-Net model achieves better recovery results when sufficient computational resources and hardware are available. W3-Net reduced the inference time and hardware requirements for real-time ptychographic imaging. This further confirms the scalability and adaptability of the W1-Net model.</p>
<p>In summary, our research presents a novel W-Net model, namely, W1-Net, for solving the phase reconstruction problems in ptychography. Compared to traditional PtychoNN methods, our model offers significant advantages in terms of training time, reconstruction performance, and scalability. This provides a more efficient, accurate, and scalable solution for research and practical applications in the field of ptychography.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: <ext-link ext-link-type="uri" xlink:href="https://github.com/mcherukara/PtychoNN">https://github.com/mcherukara/PtychoNN</ext-link>.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>CX: Conceptualization, Data curation, Formal Analysis, Investigation, Methodology, Resources, Software, Validation, Visualization, Writing&#x2013;original draft, Writing&#x2013;review and editing. LW: Conceptualization, Funding acquisition, Methodology, Resources, Software, Supervision, Validation, Visualization, Writing&#x2013;review and editing. YM: Formal Analysis, Resources, Supervision, Writing&#x2013;review and editing. YL: Writing&#x2013;review and editing. GC: Project administration, Supervision, Writing&#x2013;review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s7">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This work was supported by the Scientific and Technological Innovation project of Institute of High Energy Physics, Chinese Academy of Sciences (No. E35451U2); The National Natural Science Foundation of China (22027810); The Scientific and Technological Innovation project of Institute of High Energy Physics, Chinese Academy of Sciences (No. E3545JU2); The Network Security and Informatization Project of the Chinese Academy of Sciences (No. E32957S3).</p>
</sec>
<ack>
<p>The authors express their gratitude to all colleagues who facilitated access to and provided assistance during the experiments.</p>
</ack>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beckers</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Senkbeil</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Gorniak</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Reese</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Giewekemeyer</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Gleber</surname>
<given-names>S.-C.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Chemical contrast in soft x-ray ptychography</article-title>. <source>Phys. Rev. Lett.</source> <volume>107</volume>, <fpage>208101</fpage>. <pub-id pub-id-type="doi">10.1103/physrevlett.107.208101</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhartiya</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Batey</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Cipiccia</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Rau</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Botchway</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>X-ray ptychography imaging of human chromosomes after low-dose irradiation</article-title>. <source>Chromosome Res.</source> <volume>29</volume>, <fpage>107</fpage>&#x2013;<lpage>126</lpage>. <pub-id pub-id-type="doi">10.1007/s10577-021-09660-7</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cherukara</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Nashed</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Enfedaque</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Hexemer</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Harder</surname>
<given-names>R. J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>AI-enabled high-resolution scanning coherent diffraction imaging</article-title>. <source>Appl. Phys. Lett.</source> <volume>117</volume>. <pub-id pub-id-type="doi">10.1063/5.0013065</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Chollet</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2017</year>). <source>Xception: deep learning with depthwise separable convolutions</source>, <fpage>1251</fpage>&#x2013;<lpage>1258</lpage>.</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>D&#x2019;Alfonso</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Morgan</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sawada</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Kirkland</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Deterministic electron ptychography at atomic resolution</article-title>. <source>Phys. Rev. B</source> <volume>89</volume>, <fpage>064101</fpage>. <pub-id pub-id-type="doi">10.1103/physrevb.89.064101</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fienup</surname>
<given-names>J. R.</given-names>
</name>
</person-group> (<year>1978</year>). <article-title>Reconstruction of an object from the modulus of its Fourier transform</article-title>. <source>Opt. Lett.</source> <volume>3</volume>, <fpage>27</fpage>&#x2013;<lpage>29</lpage>. <pub-id pub-id-type="doi">10.1364/ol.3.000027</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hor&#xe9;</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ziou</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Image quality metrics: PSNR vs. SSIM</article-title>, <fpage>2366</fpage>&#x2013;<lpage>2369</lpage>. <pub-id pub-id-type="doi">10.1109/ICPR.2010.579</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2018</year>). &#x201c;<article-title>Squeeze-and-excitation networks</article-title>,&#x201d; in <source>Proceedings of the IEEE conference on computer vision and pattern recognition</source>, <fpage>7132</fpage>&#x2013;<lpage>7141</lpage>.</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>I&#x15f;&#x131;l</surname>
<given-names>&#xc7;.</given-names>
</name>
<name>
<surname>Oktem</surname>
<given-names>F. S.</given-names>
</name>
<name>
<surname>Ko&#xe7;</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Deep iterative reconstruction for phase retrieval</article-title>. <source>Appl. Opt.</source> <volume>58</volume>, <fpage>5422</fpage>&#x2013;<lpage>5431</lpage>. <pub-id pub-id-type="doi">10.1364/ao.58.005422</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Kappeler</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ghosh</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Holloway</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cossairt</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Katsaggelos</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>PtychNet: CNN based Fourier ptychography</article-title>,&#x201d; in <source>2017 IEEE international conference on image processing (ICIP)</source> (<publisher-name>IEEE</publisher-name>), <fpage>1712</fpage>&#x2013;<lpage>1716</lpage>.</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maiden</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Further improvements to the ptychographical iterative engine</article-title>. <source>Optica</source> <volume>4</volume>, <fpage>736</fpage>&#x2013;<lpage>745</lpage>. <pub-id pub-id-type="doi">10.1364/optica.4.000736</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maiden</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Rodenburg</surname>
<given-names>J. M.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>An improved ptychographical phase retrieval algorithm for diffractive imaging</article-title>. <source>Ultramicroscopy</source> <volume>109</volume>, <fpage>1256</fpage>&#x2013;<lpage>1262</lpage>. <pub-id pub-id-type="doi">10.1016/j.ultramic.2009.05.012</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nashed</surname>
<given-names>Y. S.</given-names>
</name>
<name>
<surname>Vine</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Peterka</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ross</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Jacobsen</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Parallel ptychographic reconstruction</article-title>. <source>Opt. Express</source> <volume>22</volume>, <fpage>32082</fpage>&#x2013;<lpage>32097</lpage>. <pub-id pub-id-type="doi">10.1364/oe.22.032082</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nguyen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Xue</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Nehmetallah</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Deep learning approach for Fourier ptychography microscopy</article-title>. <source>Opt. Express</source> <volume>26</volume>, <fpage>26470</fpage>&#x2013;<lpage>26484</lpage>. <pub-id pub-id-type="doi">10.1364/oe.26.026470</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pfeiffer</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>X-ray ptychography</article-title>. <source>Nat. Photonics</source> <volume>12</volume>, <fpage>9</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1038/s41566-017-0072-5</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shemilt</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Verbanis</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Schwenke</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Estandarte</surname>
<given-names>A. K.</given-names>
</name>
<name>
<surname>Xiong</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Harder</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Karyotyping human chromosomes by optical and x-ray ptychography methods</article-title>. <source>Biophysical J.</source> <volume>108</volume>, <fpage>706</fpage>&#x2013;<lpage>713</lpage>. <pub-id pub-id-type="doi">10.1016/j.bpj.2014.11.3456</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thibault</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Dierolf</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bunk</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Menzel</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pfeiffer</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Probe retrieval in ptychographic coherent diffractive imaging</article-title>. <source>Ultramicroscopy</source> <volume>109</volume>, <fpage>338</fpage>&#x2013;<lpage>343</lpage>. <pub-id pub-id-type="doi">10.1016/j.ultramic.2008.12.011</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thibault</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Dierolf</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Menzel</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bunk</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>David</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Pfeiffer</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>High-resolution scanning x-ray diffraction microscopy</article-title>. <source>Science</source> <volume>321</volume>, <fpage>379</fpage>&#x2013;<lpage>382</lpage>. <pub-id pub-id-type="doi">10.1126/science.1158573</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Woo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Debnath</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Kweon</surname>
<given-names>I. S.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). &#x201c;<article-title>ConvNeXt V2: Co-designing and scaling ConvNets with masked autoencoders</article-title>,&#x201d; in <source>Proceedings of the IEEE/CVF conference on computer vision and pattern recognition</source>, <fpage>16133</fpage>&#x2013;<lpage>16142</lpage>.</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>The global survival rate among adult out-of-hospital cardiac arrest patients who received cardiopulmonary resuscitation: a systematic review and meta-analysis</article-title>. <source>Crit. Care</source> <volume>24</volume>, <fpage>61</fpage>. <pub-id pub-id-type="doi">10.1186/s13054-020-2773-2</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>