<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">874475</article-id>
<article-id pub-id-type="doi">10.3389/fmolb.2022.874475</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Molecular Biosciences</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Artificial Intelligence Assisting the Early Detection of Active Pulmonary Tuberculosis From Chest X-Rays: A Population-Based Study</article-title>
<alt-title alt-title-type="left-running-head">Nijiati et al.</alt-title>
<alt-title alt-title-type="right-running-head">Tuberculosis Diagnosis AI Study</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Nijiati</surname>
<given-names>Mayidili</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ma</surname>
<given-names>Jie</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hu</surname>
<given-names>Chuling</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1676184/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tuersun</surname>
<given-names>Abudouresuli</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Abulizi</surname>
<given-names>Abudoukeyoumujiang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kelimu</surname>
<given-names>Abudoureyimu</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Dongyu</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Guanbin</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zou</surname>
<given-names>Xiaoguang</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/739377/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Radiology</institution>, <institution>The First People&#x2019;s Hospital of Kashi Prefecture</institution>, <addr-line>Kashi</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>School of Computer Science and Engineering</institution>, <institution>Sun Yat-sen University</institution>, <addr-line>Guangzhou</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Colorectal Surgery</institution>, <institution>The Sixth Affiliated Hospital</institution>, <institution>Sun Yat-sen University</institution>, <addr-line>Guangzhou</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department of Radiology</institution>, <institution>Kashi Area Tuberculosis Control Center</institution>, <addr-line>Kashi</addr-line>, <country>China</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Clinical Medical Research Center</institution>, <institution>The First People&#x2019;s Hospital of Kashi Prefecture</institution>, <addr-line>Kashi</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/329785/overview">Xin Gao</ext-link>, King Abdullah University of Science and Technology, Saudi Arabia</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1694915/overview">Xiaohan Xing</ext-link>, City University of Hong Kong, Hong Kong SAR, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1109187/overview">Jun Cheng</ext-link>, Shenzhen University, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Mayidili Nijiati, <email>1376906729@qq.com</email>; Guanbin Li, <email>liguanbin@mail.sysu.edu.cn</email>; Xiaoguang Zou, <email>zxgks@163.com</email>
</corresp>
<fn fn-type="equal" id="fn1">
<label>
<sup>&#x2020;</sup>
</label>
<p>These authors have contributed equally to this work and share first authorship</p>
</fn>
<fn fn-type="other">
<p>This article was submitted to Molecular Diagnostics and Therapeutics, a section of the journal Frontiers in Molecular Biosciences</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>08</day>
<month>04</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>9</volume>
<elocation-id>874475</elocation-id>
<history>
<date date-type="received">
<day>12</day>
<month>02</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>08</day>
<month>03</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Nijiati, Ma, Hu, Tuersun, Abulizi, Kelimu, Zhang, Li and Zou.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Nijiati, Ma, Hu, Tuersun, Abulizi, Kelimu, Zhang, Li and Zou</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>As a major infectious disease, <italic>tuberculosis</italic> (TB) still poses a threat to people&#x2019;s health in China. As a triage test for TB, reading chest radiography with traditional approach ends up with high inter-radiologist and intra-radiologist variability, moderate specificity and a waste of time and medical resources. Thus, this study established a deep convolutional neural network (DCNN) based artificial intelligence (AI) algorithm, aiming at diagnosing TB on posteroanterior chest X-ray photographs in an effective and accurate way. Altogether, 5,000 patients with TB and 4,628 patients without TB were included in the study, totaling to 9,628 chest X-ray photographs analyzed. Splitting the radiographs into a training set (80.4%) and a testing set (19.6%), three different DCNN algorithms, including ResNet, VGG, and AlexNet, were trained to classify the chest radiographs as images of pulmonary TB or without TB. Both the diagnostic accuracy and the area under the receiver operating characteristic curve were used to evaluate the performance of the three AI diagnosis models. Reaching an accuracy of 96.73% and marking the precise TB regions on the radiographs, ResNet algorithm-based AI outperformed the rest models and showed excellent diagnostic ability in different clinical subgroups in the stratification analysis. In summary, the ResNet algorithm-based AI diagnosis system provided accurate TB diagnosis, which could have broad prospects in clinical application for TB diagnosis, especially in poor regions with high TB incidence.</p>
</abstract>
<kwd-group>
<kwd>tuberculosis</kwd>
<kwd>chest radiograph</kwd>
<kwd>machine learning</kwd>
<kwd>artificial intelligence</kwd>
<kwd>deep convolutional neural network</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Causing by <italic>Mycobacterium tuberculosis</italic> infection, pulmonary <italic>tuberculosis</italic> (TB) is a kind of dangerous airborne chronic respiratory infectious disease (<xref ref-type="bibr" rid="B8">Ragonnet et al., 2019</xref>). TB still remains a major problem of disease control and poses a threat to the health of the public in China (<xref ref-type="bibr" rid="B12">Tusun et al., 2021</xref>). The incidence of TB in Kashi was 250.4/100,000 in 2020, reaching 4.3 times the national average incidence. TB epidemic remains severe, especially in 12 counties/cities of Kashi prefecture, Xinjiang Uygur Autonomous Region (<xref ref-type="bibr" rid="B12">Tusun et al., 2021</xref>).</p>
<p>A triage test using chest radiography is utilized for patients with typical symptoms for TB or TB-related risk factors (<xref ref-type="bibr" rid="B6">Qin et al., 2021a</xref>). Both the shortage of experienced radiologist and the high inter-radiologist and intra-radiologist variability have been affecting the performance and generalizability of the chest radiography, especially in places with a high incidence of TB and without access to high quality medical service (<xref ref-type="bibr" rid="B4">Organization, 2016</xref>). However, during the last 10&#xa0;years, the artificial intelligence (AI) aided diagnostics systems have been developing and evolving at an unprecedented pace, leading to its deployment and usage in clinical settings, and many medical image analyzing AI algorithms, which were based on deep learning and deep convolutional neural networks (DCNNs), were being utilized for radiographs reading at the same time (<xref ref-type="bibr" rid="B9">Rajpurkar et al., 2020</xref>; <xref ref-type="bibr" rid="B7">Qin et al., 2021b</xref>). Such deep learning and DCNN algorithms are able to distinguish the features and characteristics of the TB-related abnormalities in the chest X -ray photographs. Considering the great improvement of AI-assisted TB diagnosis, computer aided TB screening software is a better substitute for physicians in digital chest radiographs reading and analyzing, which was recommended by the updated guidelines of the World Health Organization (WHO) in March 2021 (<xref ref-type="bibr" rid="B5">Organization, 2021</xref>). However, there remains uncertain about what kind of algorithm or AI should be developed and put into clinical practice, since the WHO didn&#x2019;t give detailed recommendations for specific products (<xref ref-type="bibr" rid="B6">Qin et al., 2021a</xref>).</p>
<p>To date, the majority of AI algorithms for TB diagnosis have been based on small groups of individuals. Considering that a large sample for training would further improve the performance of the AI algorithm, the deep convolutional neural network (DCNN), a kind of deep learning approach, has been widely utilized for analyzing medical images. Thus, this study explored the TB diagnosis ability of three kinds of DCNNs (Resnet, VGG, and AlexNet algorithms) based on chest X-rays of 10,000 individuals.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and Methods</title>
<sec id="s2-1">
<title>Study Setting and Population</title>
<p>In this retrospective study, we trained convolutional neural network-based AI algorithms to read chest X-rays for pulmonary TB diagnosis. The workflow of the study was showed in <xref ref-type="fig" rid="F1">Figure 1</xref>. In total, 9628 X-ray images and corresponding clinical information were collected from individuals with and without TB in Kashgar, Xinjiang, China, between 2019 and 2020 (<xref ref-type="table" rid="T1">Table 1</xref>). The included cases were aged &#x2265;15&#xa0;years and underwent X-ray analysis. TB cases were diagnosed by experienced physicians based on the symptoms and the results of multiple tests and radiological examinations, including sputum culture or smear tests, Xpert tests, chest X-ray films, interferon gamma release assays and tuberculin skin tests and so on. In total, 5,000 images of TB cases and 4,628 images of non-TB cases were collected with privacy information removed and split into the training (<italic>n</italic> &#x3d; 7,703) and testing sets (<italic>n</italic> &#x3d; 1925) (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>The workflow of the study.</p>
</caption>
<graphic xlink:href="fmolb-09-874475-g001.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>A summary of clinical characteristics of training and testing sets.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left"/>
<th colspan="2" align="center">Training set</th>
<th colspan="2" align="center">Testing set</th>
</tr>
<tr>
<th align="center">TB cases</th>
<th align="center">Non-TB cases</th>
<th align="center">TB cases</th>
<th align="center">Non-TB cases</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td colspan="5" align="left">Sex</td>
</tr>
<tr>
<td align="left">&#x2003;Female</td>
<td align="center">2,118</td>
<td align="center">1885</td>
<td align="center">463</td>
<td align="center">478</td>
</tr>
<tr>
<td align="left">&#x2003;Male</td>
<td align="center">1882</td>
<td align="center">1818</td>
<td align="center">537</td>
<td align="center">447</td>
</tr>
<tr>
<td colspan="5" align="left">Age</td>
</tr>
<tr>
<td align="left">&#x2003;&#x3c;65&#xa0;years</td>
<td align="center">2,297</td>
<td align="center">1971</td>
<td align="center">461</td>
<td align="center">580</td>
</tr>
<tr>
<td align="left">&#x2003;&#x2265;65&#xa0;years</td>
<td align="center">1703</td>
<td align="center">1732</td>
<td align="center">539</td>
<td align="center">345</td>
</tr>
<tr>
<td colspan="5" align="left">Symptoms</td>
</tr>
<tr>
<td align="left">&#x2003;Cough</td>
<td align="center">3,304</td>
<td align="center">6</td>
<td align="center">782</td>
<td align="center">8</td>
</tr>
<tr>
<td align="left">&#x2003;Expectoration</td>
<td align="center">2,726</td>
<td align="center">4</td>
<td align="center">606</td>
<td align="center">1</td>
</tr>
<tr>
<td align="left">&#x2003;Hemoptysis</td>
<td align="center">461</td>
<td align="center">5</td>
<td align="center">128</td>
<td align="center">4</td>
</tr>
<tr>
<td align="left">&#x2003;Fever</td>
<td align="center">1,563</td>
<td align="center">4</td>
<td align="center">429</td>
<td align="center">0</td>
</tr>
<tr>
<td align="left">&#x2003;Fatigue</td>
<td align="center">1,143</td>
<td align="center">0</td>
<td align="center">248</td>
<td align="center">0</td>
</tr>
<tr>
<td align="left">&#x2003;Night Sweating</td>
<td align="center">789</td>
<td align="center">0</td>
<td align="center">135</td>
<td align="center">0</td>
</tr>
<tr>
<td colspan="5" align="left">Bacteriological Test</td>
</tr>
<tr>
<td align="left">&#x2003;Sputum Culture/Smear Positive</td>
<td align="center">807</td>
<td align="center">0</td>
<td align="center">297</td>
<td align="center">0</td>
</tr>
<tr>
<td align="left">&#x2003;Bacteriological Test Positive</td>
<td align="center">1788</td>
<td align="center">0</td>
<td align="center">509</td>
<td align="center">0</td>
</tr>
<tr>
<td align="left">&#x2003;Bacteriological Test Negative</td>
<td align="center">2,212</td>
<td align="center">3,703</td>
<td align="center">491</td>
<td align="center">925</td>
</tr>
<tr>
<td align="left">&#x2003;Total</td>
<td align="center">4,000</td>
<td align="center">3,703</td>
<td align="center">1,000</td>
<td align="center">925</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Sputum Culture/Smear Positive: sputum culture positive or smear positive. Bacteriological Test Positive: sputum culture/smear positive or Xpert test positve. Bacteriological Test Negative: sputum culture negative, sputum smear negative and Xpert test negative.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s2-2">
<title>X-Rays Images Preprocessing</title>
<p>As a tool widely used in medical image semantic segmentation, U-Net has been applied to extract semantic information and generate segmentation results (<xref ref-type="bibr" rid="B10">Ronneberger et al., 2015</xref>; <xref ref-type="bibr" rid="B17">Zunair and Ben Hamza, 2021</xref>). In order to focus on pulmonary TB-affected regions that appeared inside the lungs, U-Net was used for the lung segment before TB classification. After image cropping and resizing, the lung region images served as an input for the classification convolutional neural network (<xref ref-type="fig" rid="F2">Figure 2</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Overall structure of the DCNN-based AI diagnosis system. The workflow of the system could be divided into two parts: image segmentation network (U-Net), image classification network (ResNet or VGG or AlexNet). Regions of the lung in the original chest X-ray photographs were recognized by the U-Net. Then, the cropped and resized lung region images served as an input for image classification algorithms, which generated diagnoses.</p>
</caption>
<graphic xlink:href="fmolb-09-874475-g002.tif"/>
</fig>
</sec>
<sec id="s2-3">
<title>Development of AI Algorithms</title>
<p>For the classification network, we used ResNet34 (<xref ref-type="bibr" rid="B1">He et al., 2016</xref>), VGG (<xref ref-type="bibr" rid="B11">Simonyan and Zisserman, 2014</xref>) and AlexNet (<xref ref-type="bibr" rid="B2">Krizhevsky et al., 2012</xref>). The structures of the three convolutional neural networks were illustrated in <xref ref-type="fig" rid="F2">Figure 2</xref>. We loaded the pretrained model in ImageNet and replaced the last linear classification layer with a new linear layer for negative (individuals without TB) or positive (with TB) prediction. The ResNet model was trained for 120 epochs in total with chest X-ray images of the training set (<xref ref-type="sec" rid="s11">Supplementary Figure S1</xref>), setting the initial learning rate at 1e&#x2212;3 and using the inverse learning rate decay schedule. VGG and AlexNet were also trained with the same settings, and then three AI algorithms were validated on the testing set.</p>
</sec>
<sec id="s2-4">
<title>Comparison of AI Algorithms and Stratification Analysis</title>
<p>To evaluate the performance of the three models, the accuracy, sensitivity and specificity of the three models were calculated in both sets for comparison (<xref ref-type="table" rid="T2">Table 2</xref>), and the plots of receiver operating characteristic (ROC) curves with area under the curve (AUC) values were also generated with the pROC package. The AI algorithm with the best performance was chosen for the following analysis and visualization. To further investigate the reliability and robustness of the AI models, cases of the testing set were stratified into multiple subgroups based on their age, sex and respiratory symptoms, and then the AUC value of each model were calculated and compared within each subgroup with the pROC package.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>The performance of the models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left"/>
<th colspan="3" align="center">Training set</th>
<th rowspan="2" align="center">AUC (95% CI)</th>
<th colspan="3" align="center">Testing set</th>
<th rowspan="2" align="center">AUC (95% CI)</th>
</tr>
<tr>
<th align="center">Accuracy (%)</th>
<th align="center">Sensitivity (%)</th>
<th align="center">Specificity (%)</th>
<th align="center">Accuracy (%)</th>
<th align="center">Sensitivity (%)</th>
<th align="center">Specificity (%)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">AlexNet</td>
<td align="char" char=".">98.34</td>
<td align="char" char=".">98.58</td>
<td align="char" char=".">98.08</td>
<td align="char" char="(">0.9988 (0.9984&#x2013;0.9992)</td>
<td align="char" char=".">95.06</td>
<td align="char" char=".">93.20</td>
<td align="char" char=".">97.08</td>
<td align="char" char="(">0.9917 (0.9889&#x2013;0.9945)</td>
</tr>
<tr>
<td align="left">VGG</td>
<td align="char" char=".">99.03</td>
<td align="char" char=".">99.75</td>
<td align="char" char=".">98.24</td>
<td align="char" char="(">0.9998 (0.9997&#x2013;0.9999)</td>
<td align="char" char=".">94.96</td>
<td align="char" char=".">94.20</td>
<td align="char" char=".">95.78</td>
<td align="char" char="(">0.9902 (0.9872&#x2013;0.9932)</td>
</tr>
<tr>
<td align="left">ResNet</td>
<td align="char" char=".">99.92</td>
<td align="char" char=".">99.90</td>
<td align="char" char=".">99.95</td>
<td align="char" char="(">1 (1&#x2013;1)</td>
<td align="char" char=".">96.73</td>
<td align="char" char=".">95.50</td>
<td align="char" char=".">98.05</td>
<td align="char" char="(">0.9944 (0.9921&#x2013;0.9967)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>AUC, the area under the receiver operator characteristic curve; 95% CI: 95% confidence interval.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s2-5">
<title>Interpretability Analysis and Feature Visualization</title>
<p>After the comparison, ResNet algorithm was chosen for further interpretability analysis and feature visualization. After the global average pooling layer of ResNet, we obtained a 512-dimensional vector for each image. To visualize the learned feature, we used the t-SNE method, which could reduce the high-dimensional vector to a low-dimensional vector (<xref ref-type="bibr" rid="B13">Van et al., 2008</xref>). Here, we reduced each vector to 2-dimension and therefore, visualized the differences in high-dimensional complex features between the positive and negative images captured by the AI algorithm. We also obtained sets of feature maps from the last convolution layer of ResNet. Then, class activation maps (CAMs) were generated by the linear combination of the fully connected layer weights and feature maps (<xref ref-type="bibr" rid="B16">Zhou et al., 2016</xref>). Discriminative regions of the CAMs were in red (hot areas), indicating the AI-predicted TB regions.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<p>In the beginning of the study, 9628 X-ray images with detailed clinical information were collected (<xref ref-type="fig" rid="F1">Figure 1</xref>). Clinical characteristics of the collected cases were summarized in <xref ref-type="table" rid="T1">Table 1</xref>. Three different AI algorithms were trained on a large dataset containing 4,000 images from patients with TB and 3,703 images from individuals without TB (<xref ref-type="fig" rid="F2">Figure 2</xref>). After training, these AI algorithms were compared to each other on the testing set and the training set. The accuracy, sensitivity and specificity of the three algorithms were all higher than 94% when they were tested on the testing set (<xref ref-type="table" rid="T2">Table 2</xref>). The ResNet model had the strongest diagnostic ability among the three AI algorithms, whose accuracy, sensitivity and specificity reached 96.73, 95.50 and 98.05%, respectively. The performance of the AI models were further investigated with ROC curves. All the AI algorithms performed well in both training set and testing set (<xref ref-type="fig" rid="F3">Figures 3A,B</xref>), with AUC values higher than 0.99 (<xref ref-type="table" rid="T2">Table 2</xref>). The AUC value of the AlexNet, VGG and ResNet reached 0.9917, 0.9902 and 0.9944, respectively on the testing set. These results suggested that the ResNet algorithm outperformed the rest models, demonstrating its excellent diagnostic value for TB and was selected for further analysis and visualization.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Diagnostic ability of the AI models. <bold>(A)</bold> ROC curves of three different AI models of the training set. <bold>(B)</bold> ROC curves of three different AI models of the testing set. <bold>(C)</bold> Diagnostic ability of ResNet algorithm visualized by t-SNE algorithm. Blue and orange dots indicated TB and non-TB cases of the testing set, respectively.</p>
</caption>
<graphic xlink:href="fmolb-09-874475-g003.tif"/>
</fig>
<p>To understand how the AI algorithms distinguished TB radiographs from non-TB ones, the dimensional reduction t-SNE algorithm was applied to reduce the high-dimensional differences in visual-semantic information aggregated by the AI algorithm between TB-positive and TB-negative images into a two-dimensional plot. Here, taking ResNet as an example, an evident boundary was observed between the positive and negative image groups, while clustered distributions within each group were also observed, indicating that the ResNet algorithm succeeded in recognizing shared features of TB-positive images and features that distinguished the positive and negative images (<xref ref-type="fig" rid="F3">Figure 3C</xref>).</p>
<p>Apart from evaluating the diagnostic accuracy on the entire testing set or training set, stratification analysis was also conducted to verified the reliability and the robustness of the ResNet algorithm. The ResNet model was the best performing model with highest AUC value in all subgroups of the training set and most subgroups of the testing set (<xref ref-type="fig" rid="F4">Figure 4</xref>). The result of the stratification analysis suggested that the ResNet algorithm was capable of providing accurate TB diagnoses for people of all ages and both sexes or patients with different respiratory symptoms.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Stratification analysis. Subgrouping by important clinical characteristics, including sex <bold>(A,D)</bold>, age <bold>(B,E)</bold> and respiratory symptoms <bold>(C,F)</bold>, AUC values of the three models were calculated and compared in both sets. Young: under 65&#xa0;years old. Old: 65&#xa0;years old or over 65&#xa0;years old.</p>
</caption>
<graphic xlink:href="fmolb-09-874475-g004.tif"/>
</fig>
<p>In order to step further in assisting the TB diagnosis, we visualized the ResNet algorithm recognized TB affected regions of the chest radiographs using the OpenCV package. Masked with red and alpha-blended with the black-and-white input X-ray image, &#x201c;hot regions&#x201d; drawn by AI provided accurate disease-affected areas and indicated high consistency with the TB regions mapped by experienced physicians and radiologists with bounding boxes (<xref ref-type="fig" rid="F5">Figure 5</xref>). Our method not only provided a correct diagnosis of pulmonary TB but also identified precise TB regions with a heatmap, which has great potential in assisting the diagnosis of TB as an interpretable and reliable AI algorithm.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>CAMs generated by ResNet matched the precise regions of TB abnormalities. Bounding boxes [in <bold>(A,C,E)</bold>] meant the regions of abnormalities identified by doctors and hot regions [in <bold>(B,D,F)</bold>] showed the discriminative regions generated by AI algorithm.</p>
</caption>
<graphic xlink:href="fmolb-09-874475-g005.tif"/>
</fig>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>As an effective method for TB screening and diagnosis, chest radiography is recommended by multiple clinical guidelines despite its high inter-radiologist and intra-radiologist variability, moderate specificity and other limitations. In contrast to manual diagnosis, deep learning based computer-assisted diagnostic systems have the potential to overcome the aforementioned drawbacks and provide professional diagnosis for TB. Here, we established a ResNet-based chest X-ray AI diagnosis system for TB, which provided accurate diagnoses and was capable of serving as triage tests at the bedside.</p>
<p>A previous study has reported that the AlexNet based machine learning algorithm can accurately classify TB based on chest radiography (<xref ref-type="bibr" rid="B3">Lakhani and Sundaram, 2017</xref>). Here, our results indicated that the ResNet-based AI was superior to AlexNet and VGG, which suggested that the ResNet diagnosis system would better assist physicians in diagnosing TB.</p>
<p>Low interpretability is one of the major inherent problems of the machine learning models, including deep learning algorithms. Due to the complex calculating process and tremendous amount parameters of the neural networks, it remains difficult for us to learn about how they work and why they come to certain conclusions that remarkably similar to human experts&#x2019; opinions, suggesting that the neural networks, especially deep neural networks, are so-called black boxes (<xref ref-type="bibr" rid="B14">Wang et al., 2021</xref>). Even though depth of the DCNNs are becoming sheerer and sheer, many tools, including t-SNE and CAMs, are still available for the visualization of neural networks and breaking up the black boxes, convincing us that the neural network algorithm have the ability to recognized features of abnormality in the medical images rather than nonrelevant parts of the graphs. In this study, we wanted to know whether the trained DCNN based AI algorithm was focusing at regions of TB-associated abnormality in the lung. As illustrated in <xref ref-type="fig" rid="F5">Figure 5</xref>, the discriminative regions, which were recognized by AI and masked with red, were the exact TB regions recognized and identified by doctors. This indicates that the ResNet-based AI algorithm not only provides doctors with highly accurate diagnoses but also interpretable marks of TB regions, which is of great help in analyzing chest X-ray images and recognizing TB in patients.</p>
<p>As a relatively remote and poor region with scarce medical resources in the past years, Xinjiang has been troubled by the continuous spread of TB (<xref ref-type="bibr" rid="B15">Zheng et al., 2021</xref>). Despite of financial difficulties, Xinjiang has managed to carry out many new policies and plans to boost investment in TB prevention and control, aiming at the early detection and proper treatment of TB cases. Early diagnosis of active TB is the key to controlling the rapid rise of TB incidence. Considering the excellent performance of the ResNet-based AI diagnosis system, it would greatly prompt the early diagnosis of active TB and help in preventing the spread of TB in Xinjiang.</p>
<p>However, there are several limitations in the study. First, although sputum culture is the gold standard for active pulmonary TB diagnosis, some patients of pulmonary TB have negative sputum culture results. Taking the results of multiple tests and typical clinical manifestation together, patients of TB were diagnosed, which remains risks of misdiagnoses and producing wrong labels for the chest radiographs. Besides, the chest radiographs were collected in two hospitals, suggesting that differences might exist between images captured in the two centers. In addition, we limited the study population to people aged &#x2265;15&#xa0;years, which also limited the generalizability of our AI diagnosis system towards pediatric cases.</p>
<p>In conclusion, our study established a ResNet-based AI diagnosis system that was effective in diagnosing active TB from chest radiographs without external clinical information assistance.</p>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The clinical data and chest radiographs are not publicly available for patient privacy protection purposes. Any individual affiliated with an academic institution may request access to the original images and clinical data from the corresponding author (MN) for non-commercial, research purposes.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>Study design and conception were proposed by GL and XZ; paper writing were done by MN, JM, CH, GL, and XZ; chest radiographs were collected by MN, AT, AA, AK, and XZ; AI model training, testing and visualizing were done by JM, CH, DZ, and GL. All authors interpreted the results and revised the manuscript. All authors read and approved the final manuscript.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This study was supported by the &#x201c;Tianshan Innovation Team Plan&#x201d; of the Autonomous Region (No. 2022D14007, MN), the Open Project of The State Key Laboratory for the Causes and Prevention of Middle Asian High Disease Jointly Built by the Province and the Ministry (No. SKL-HIDCA-2021-JH6, MN), Innovation Team Project of &#x201c;Pearl River Scholar Tianshan Talents&#x201d; Cooperative Expert Studio of The First People&#x2019;s Hospital of Kashi Prefecture (No. KDYY202017, MN).</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>We would like to thank Editage (<ext-link ext-link-type="uri" xlink:href="http://www.editage.cn">www.editage.cn</ext-link>) for English language editing.</p>
</ack>
<sec id="s11">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmolb.2022.874475/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmolb.2022.874475/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.doc" id="SM1" mimetype="application/doc" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<sec id="s10">
<title>Abbreviations</title>
<p>AI, artificial intelligence; AUC, area under the curve; CAMs, class activation maps; DCNN, deep convolutional neural network; ROC, receiver operating characteristic; TB, <italic>tuberculosis.</italic>
</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>He</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2016</year>). &#x201c;<article-title>Deep Residual Learning for Image Recognition</article-title>,&#x201d; in <conf-name>Proceedings of the 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)</conf-name>, <conf-loc>Las Vegas, NV, USA</conf-loc>, <conf-date>December 2016</conf-date>. <pub-id pub-id-type="doi">10.1109/cvpr.2016.90</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krizhevsky</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sutskever</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Hinton</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>ImageNet Classification with Deep Convolutional Neural Networks</article-title>. <source>Commun. ACM</source> <volume>60</volume>, <fpage>84</fpage>&#x2013;<lpage>90</lpage>. <comment>NIPS</comment>. <pub-id pub-id-type="doi">10.1145/3065386</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lakhani</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sundaram</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Deep Learning at Chest Radiography: Automated Classification of Pulmonary Tuberculosis by Using Convolutional Neural Networks</article-title>. <source>Radiology</source> <volume>284</volume> (<issue>2</issue>), <fpage>574</fpage>&#x2013;<lpage>582</lpage>. <pub-id pub-id-type="doi">10.1148/radiol.2017162326</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Organization</surname>
<given-names>W. H.</given-names>
</name>
</person-group> (<year>2016</year>). <source>Chest Radiography in Tuberculosis Detection: Summary of Current WHO Recommendations and Guidance on Programmatic Approaches</source>. <publisher-loc>Geneva</publisher-loc>: <publisher-name>World Health Organization</publisher-name>. </citation>
</ref>
<ref id="B5">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Organization</surname>
<given-names>W. H.</given-names>
</name>
</person-group> (<year>2021</year>). <source>WHO Consolidated Guidelines on Tuberculosis: Module 2: Screening: Systematic Screening for Tuberculosis Disease</source>. <publisher-loc>Geneva</publisher-loc>: <publisher-name>World Health Organization</publisher-name>. </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qin</surname>
<given-names>Z. Z.</given-names>
</name>
<name>
<surname>Ahmed</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sarker</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Paul</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Adel</surname>
<given-names>A. S. S.</given-names>
</name>
<name>
<surname>Naheyan</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2021a</year>). <article-title>Tuberculosis Detection from Chest X-Rays for Triaging in a High Tuberculosis-burden Setting: an Evaluation of Five Artificial Intelligence Algorithms</article-title>. <source>The Lancet Digital Health</source> <volume>3</volume> (<issue>9</issue>), <fpage>e543</fpage>&#x2013;<lpage>e554</lpage>. <pub-id pub-id-type="doi">10.1016/S2589-7500(21)00116-3</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qin</surname>
<given-names>Z. Z.</given-names>
</name>
<name>
<surname>Naheyan</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ruhwald</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Denkinger</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Gelaw</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Nash</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2021b</year>). <article-title>A New Resource on Artificial Intelligence Powered Computer Automated Detection Software Products for Tuberculosis Programmes and Implementers</article-title>. <source>Tuberculosis</source> <volume>127</volume>, <fpage>102049</fpage>. <pub-id pub-id-type="doi">10.1016/j.tube.2020.102049</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ragonnet</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Trauer</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Geard</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Scott</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>McBryde</surname>
<given-names>E. S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Profiling <italic>Mycobacterium tuberculosis</italic> Transmission and the Resulting Disease burden in the Five Highest Tuberculosis burden Countries</article-title>. <source>BMC Med.</source> <volume>17</volume> (<issue>1</issue>), <fpage>208</fpage>. <pub-id pub-id-type="doi">10.1186/s12916-019-1452-0</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rajpurkar</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>O&#x2019;Connell</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Schechter</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Asnani</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kiani</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>CheXaid: Deep Learning Assistance for Physician Diagnosis of Tuberculosis Using Chest X-Rays in Patients with HIV</article-title>. <source>Npj Digit. Med.</source> <volume>3</volume>, <fpage>115</fpage>. <pub-id pub-id-type="doi">10.1038/s41746-020-00322-2</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ronneberger</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Fischer</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Brox</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2015</year>). &#x201c;<article-title>U-net: Convolutional Networks for Biomedical Image Segmentation</article-title>,&#x201d; in <source>Medical Image Computing and Computer-Assisted Intervention &#x2013; MICCAI 2015</source>. Editors <person-group person-group-type="editor">
<name>
<surname>Navab</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Hornegger</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wells</surname>
<given-names>W. M.</given-names>
</name>
<name>
<surname>Frangi</surname>
<given-names>A. F.</given-names>
</name>
</person-group> (<publisher-loc>New York City, NY</publisher-loc>: <publisher-name>Springer International Publishing</publisher-name>), <fpage>234</fpage>&#x2013;<lpage>241</lpage>. </citation>
</ref>
<ref id="B11">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Simonyan</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zisserman</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Very Deep Convolutional Networks for Large-Scale Image Recognition</article-title>. <comment>Available: <ext-link ext-link-type="uri" xlink:href="https://ui.adsabs.harvard.edu/abs/2014arXiv1409.1556S">https://ui.adsabs.harvard.edu/abs/2014arXiv1409.1556S</ext-link> (Accessed September 01, 2014)</comment>. </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tusun</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Abulimiti</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Abulimiti</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mamuti</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>The Epidemiological Characteristics of Pulmonary Tuberculosis - Kashgar Prefecture, Xinjiang Uygur Autonomous Region, China, 2011-2020</article-title>. <source>China CDC Wkly</source> <volume>3</volume> (<issue>26</issue>), <fpage>557</fpage>&#x2013;<lpage>561</lpage>. <pub-id pub-id-type="doi">10.46234/ccdcw2021.144</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van</surname>
<given-names>D. M. L.</given-names>
</name>
<name>
<surname>Hinton</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Visualizing High-Dimensional Data Using T-SNE</article-title>. <source>J. Machine Learn. Res.</source> <volume>9</volume> (<issue>2</issue>), <fpage>2579</fpage>&#x2013;<lpage>2605</lpage>. </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Z. J.</given-names>
</name>
<name>
<surname>Turko</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Shaikh</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Das</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Hohman</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>CNN Explainer: Learning Convolutional Neural Networks with Interactive Visualization</article-title>. <source>IEEE Trans. Vis. Comput. Graphics</source> <volume>27</volume> (<issue>2</issue>), <fpage>1396</fpage>&#x2013;<lpage>1406</lpage>. <pub-id pub-id-type="doi">10.1109/TVCG.2020.3030418</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zheng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Cui</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Predictive Study of Tuberculosis Incidence by Time Series Method and Elman Neural Network in Kashgar, China</article-title>. <source>BMJ Open</source> <volume>11</volume> (<issue>1</issue>), <fpage>e041040</fpage>. <pub-id pub-id-type="doi">10.1136/bmjopen-2020-041040</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Khosla</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lapedriza</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Oliva</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Torralba</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). &#x201c;<article-title>Learning Deep Features for Discriminative Localization</article-title>,&#x201d; in <conf-name>Proceedings of the 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)</conf-name>, <conf-loc>Las Vegas, NV, USA</conf-loc>, <conf-date>June 2016</conf-date>. <pub-id pub-id-type="doi">10.1109/cvpr.2016.319</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zunair</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ben Hamza</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Sharp U-Net: Depthwise Convolutional Network for Biomedical Image Segmentation</article-title>. <source>Comput. Biol. Med.</source> <volume>136</volume>, <fpage>104699</fpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2021.104699</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>