<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2023.1196414</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Oncology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Generalization optimizing machine learning to improve CT scan radiomics and assess immune checkpoint inhibitors&#x2019; response in non-small cell lung cancer: a multicenter cohort study</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Tonneau</surname>
<given-names>Marion</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1328960"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Phan</surname>
<given-names>Kim</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Manem</surname>
<given-names>Venkata S. K.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/349271"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Low-Kam</surname>
<given-names>Cecile</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Dutil</surname>
<given-names>Francis</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kazandjian</surname>
<given-names>Suzanne</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Vanderweyen</surname>
<given-names>Davy</given-names>
</name>
<xref ref-type="aff" rid="aff7">
<sup>7</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/540369"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Panasci</surname>
<given-names>Justin</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Malo</surname>
<given-names>Julie</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2322403"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Coulombe</surname>
<given-names>Fran&#xe7;ois</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gagn&#xe9;</surname>
<given-names>Andr&#xe9;anne</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Elkrief</surname>
<given-names>Arielle</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff8">
<sup>8</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Belka&#xef;d</surname>
<given-names>Wiam</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Di Jorio</surname>
<given-names>Lisa</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2355411"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Orain</surname>
<given-names>Michele</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bouchard</surname>
<given-names>Nicole</given-names>
</name>
<xref ref-type="aff" rid="aff9">
<sup>9</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2310445"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Muanza</surname>
<given-names>Thierry</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<xref ref-type="aff" rid="aff10">
<sup>10</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/66523"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Rybicki</surname>
<given-names>Frank J.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kafi</surname>
<given-names>Kam</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/830238"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Huntsman</surname>
<given-names>David</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Joubert</surname>
<given-names>Philippe</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="aff" rid="aff11">
<sup>11</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chandelier</surname>
<given-names>Florent</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Routy</surname>
<given-names>Bertrand</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff8">
<sup>8</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1326364"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Cancer Research, Centre de Recherche du Centre Hospitalier Universitaire de Montr&#xe9;al (CRCHUM)</institution>, <addr-line>Montreal, QC</addr-line>, <country>Canada</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Universit&#xe9; de M&#xe9;decine</institution>, <addr-line>Lille</addr-line>, <country>France</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Imagia Canexia Health</institution>, <addr-line>Montreal, QC</addr-line>, <country>Canada</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Institut Universitaire de Cardiologie et de Pneumologie de Quebec, Universit&#xe9; Laval</institution>, <addr-line>Qu&#xe9;bec City, QC</addr-line>, <country>Canada</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Department of Mathematics and Computer Science, University of Quebec at Trois-Rivi&#xe8;res</institution>, <addr-line>Trois-Rivi&#xe8;res, QC</addr-line>, <country>Canada</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>Department of Medical Oncology, Jewish General Hospital</institution>, <addr-line>Montreal, QC</addr-line>, <country>Canada</country>
</aff>
<aff id="aff7">
<sup>7</sup>
<institution>Department of Radiology, Centre Hospitalier de Sherbrooke (CHUS)</institution>, <addr-line>Sherbrooke, QC</addr-line>, <country>Canada</country>
</aff>
<aff id="aff8">
<sup>8</sup>
<institution>Hemato-Oncology Division, Centre Hospitalier de l&#x2019;universit&#xe9; de Montreal</institution>, <addr-line>Montreal, QC</addr-line>, <country>Canada</country>
</aff>
<aff id="aff9">
<sup>9</sup>
<institution>Department of Oncology, Centre Hospitalier de Sherbrooke (CHUS)</institution>, <addr-line>Sherbrooke, QC</addr-line>, <country>Canada</country>
</aff>
<aff id="aff10">
<sup>10</sup>
<institution>Department of Radiation Oncology, Lady Davis Institute of the Jewish General Hospital</institution>, <addr-line>Montreal, QC</addr-line>, <country>Canada</country>
</aff>    <aff id="aff11">
<sup>11</sup>
<institution>Department of Pathology, Institut Universitaire de Cardiologie et de Pneumologie de Qu&#xe9;bec</institution>, <addr-line>Qu&#xe9;bec, QC</addr-line>, <country>Canada</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Donghong Zhang, Emory University, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Fran&#xe7;ois Lucia, Centre Hospitalier Regional Universitaire (CHU) de Brest, France; Han Yu, Roswell Park Comprehensive Cancer Center, United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Bertrand Routy, <email xlink:href="mailto:bertrand.routy@umontreal.ca">bertrand.routy@umontreal.ca</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>20</day>
<month>07</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>13</volume>
<elocation-id>1196414</elocation-id>
<history>
<date date-type="received">
<day>29</day>
<month>03</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>28</day>
<month>06</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Tonneau, Phan, Manem, Low-Kam, Dutil, Kazandjian, Vanderweyen, Panasci, Malo, Coulombe, Gagn&#xe9;, Elkrief, Belka&#xef;d, Di Jorio, Orain, Bouchard, Muanza, Rybicki, Kafi, Huntsman, Joubert, Chandelier and Routy</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Tonneau, Phan, Manem, Low-Kam, Dutil, Kazandjian, Vanderweyen, Panasci, Malo, Coulombe, Gagn&#xe9;, Elkrief, Belka&#xef;d, Di Jorio, Orain, Bouchard, Muanza, Rybicki, Kafi, Huntsman, Joubert, Chandelier and Routy</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Recent developments in artificial intelligence suggest that radiomics may represent a promising non-invasive biomarker to predict response to immune checkpoint inhibitors (ICIs). Nevertheless, validation of radiomics algorithms in independent cohorts remains a challenge due to variations in image acquisition and reconstruction. Using radiomics, we investigated the importance of scan normalization as part of a broader machine learning framework to enable model external generalizability to predict ICI response in non-small cell lung cancer (NSCLC) patients across different centers.</p>
</sec>
<sec>
<title>Methods</title>
<p>Radiomics features were extracted and compared from 642 advanced NSCLC patients on pre-ICI scans using established open-source PyRadiomics and a proprietary DeepRadiomics deep learning technology. The population was separated into two groups: a discovery cohort of 512 NSCLC patients from three academic centers and a validation cohort that included 130 NSCLC patients from a fourth center. We harmonized images to account for variations in reconstruction kernel, slice thicknesses, and device manufacturers. Multivariable models, evaluated using cross-validation, were used to estimate the predictive value of clinical variables, PD-L1 expression, and PyRadiomics or DeepRadiomics for progression-free survival at 6 months (PFS-6).</p>
</sec>
<sec>
<title>Results</title>
<p>The best prognostic factor for PFS-6, excluding radiomics features, was obtained with the combination of Clinical + PD-L1 expression (AUC = 0.66 in the discovery and 0.62 in the validation cohort). Without image harmonization, combining Clinical + PyRadiomics or DeepRadiomics delivered an AUC = 0.69 and 0.69, respectively, in the discovery cohort, but dropped to 0.57 and 0.52, in the validation cohort. This lack of generalizability was consistent with observations in principal component analysis clustered by CT scan parameters. Subsequently, image harmonization eliminated these clusters. The combination of Clinical + DeepRadiomics reached an AUC = 0.67 and 0.63 in the discovery and validation cohort, respectively. Conversely, the combination of Clinical + PyRadiomics failed generalizability validations, with AUC = 0.66 and 0.59.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>We demonstrated that a risk prediction model combining Clinical + DeepRadiomics was generalizable following CT scan harmonization and machine learning generalization methods. These results had similar performances to routine oncology practice using Clinical + PD-L1. This study supports the strong potential of radiomics as a future non-invasive strategy to predict ICI response in advanced NSCLC.</p>
</sec>
</abstract>
<kwd-group>
<kwd>radiomics</kwd>
<kwd>Deeplearning</kwd>
<kwd>NSCLC</kwd>
<kwd>immunotherapy</kwd>
<kwd>DeepRadiomics</kwd>
</kwd-group>
<contract-sponsor id="cn001">Fondation pour la Recherche Nuovo-Soldati<named-content content-type="fundref-id">10.13039/501100009691</named-content>
</contract-sponsor>
<counts>
<fig-count count="4"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="38"/>
<page-count count="10"/>
<word-count count="4354"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Thoracic Oncology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>The recent advent of radiomics by quantitative image analysis has been gaining interest in oncology as a novel strategy for cancer screening and predicting treatment response (<xref ref-type="bibr" rid="B1">1</xref>). Immune checkpoint inhibitors (ICIs) represent the standard of care for patients with advanced non-small cell lung cancer (NSCLC), and development of biomarkers represents a paramount interest (<xref ref-type="bibr" rid="B2">2</xref>&#x2013;<xref ref-type="bibr" rid="B4">4</xref>). Nevertheless, primary resistance to ICIs remains unpredictable, reaching up to 60%, while the rate of secondary resistance approaches 100% (<xref ref-type="bibr" rid="B5">5</xref>&#x2013;<xref ref-type="bibr" rid="B7">7</xref>). Assessment of PD-L1 expression in tumor tissue has been widely used to determine the therapeutic approach of either a single-agent anti-PD-1 inhibitor or the combination of platinum doublet with anti-PD-1 for patients with tumor PD-L1 expression &#x2265;50% or &lt;50%, respectively (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B8">8</xref>).</p>
<p>Radiomics has been shown to predict CD8<sup>+</sup> T-cell infiltration and response to ICIs or radiotherapy (<xref ref-type="bibr" rid="B9">9</xref>&#x2013;<xref ref-type="bibr" rid="B12">12</xref>). Additional studies attempted to determine PD-L1 expression, the only approved predictive biomarker in advanced NSCLC (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B14">14</xref>). Nevertheless, validation of radiomic models requires large image datasets that include different cancer centers and a variety of computed tomography (CT) scanners. The necessary diversity is a major hurdle to validate published radiomics signatures in independent cohorts (<xref ref-type="bibr" rid="B15">15</xref>). Different image acquisition parameters and different reconstruction kernels with varying slice thicknesses alter the predictive potential of radiomics (<xref ref-type="bibr" rid="B16">16</xref>). Therefore, the development of signatures applicable across academic centers is a challenge that has stymied the adoption of radiomics in routine oncology clinical practice. Altogether, this highlights the importance of harmonizing image acquisition and reconstruction procedures to reduce multicenter variability before gathering data (<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B18">18</xref>). In recent years, research efforts have focused on developing a statistical harmonization strategy called ComBat (<xref ref-type="bibr" rid="B18">18</xref>&#x2013;<xref ref-type="bibr" rid="B20">20</xref>). ComBat acts directly on already computed features, not on the original images. While a privacy advantage on one hand, this method is only capable of harmonizing for a single batch effect at a time; as further detailed (<xref ref-type="bibr" rid="B21">21</xref>), if variance in image acquisition and reconstruction protocols affects image properties, then different batches should be used for the same scanner corresponding to different settings. Furthermore, four assumptions have to be met for ComBat to generate valid results among which (<xref ref-type="bibr" rid="B1">1</xref>) covariates (if any) that might explain different distributions at two or more sites have to be identified and considered to redesign the original ComBat approach (<xref ref-type="bibr" rid="B2">2</xref>); the different sets of feature values to be realigned have to be independent, which challenges the very use of PyRadiomics known for many correlating features; and (<xref ref-type="bibr" rid="B3">3</xref>) determining a single transformation with ComBat from data with different tissue or tumor types does not always lead to satisfactory data realignments, because different texture patterns are not necessarily affected identically by the image acquisition and reconstruction protocols (<xref ref-type="bibr" rid="B21">21</xref>). Taking these constraints altogether, the present study hypothesized that developing specific machine learning generalization methods rather than applying more complex feature harmonization strategies might prove more successful.</p>
<p>In this study, using conventional harmonization techniques together with AI generalization strategies, we showed that a radiomic signature generated in a discovery cohort from three independent cancer centers of NSCLC patients amenable to ICI to predict PFS at 6 months could be validated in a fourth cohort. This new method designed for generalizability rather than traditional performance has the potential to further the use of radiomics in routine oncology practice.</p>
</sec>
<sec id="s2">
<title>Methods</title>
<sec id="s2_1">
<title>Study population</title>
<p>This retrospective study included 642 advanced NSCLC patients treated with anti-PD-1 alone or in combination with platinum-doublet chemotherapy between 2015 and 2021 in the chemotherapy-refractory or first-line settings. Signed, informed consent was obtained from each patient, and the study was approved by the Institutional Review Board [Human Ethics Committee (MP-02-2019-8091)] at four academic institutions where patient data were acquired: Centre Hospitalier de l&#x2019;Universit&#xe9; de Montr&#xe9;al (CHUM), Jewish General Hospital in Montreal (JGH), Institut Universitaire de Cardiologie et Pneumologie de Qu&#xe9;bec &#x2013; Universit&#xe9; Laval (IUCPQ-UL), and Centre Hospitalier de l&#x2019;Universit&#xe9; de Sherbrooke (CHUS). All patients with histology-proven stage III or IV NSCLC treated with ICI and with a pre-ICI CT scan were eligible for retrospective review. Response Evaluation Criteria in Solid Tumors (RECIST) criteria version 1.1 was used to assess tumor response, and all patients were followed until death or until the data were locked on 15 January 2022 (<xref ref-type="bibr" rid="B22">22</xref>).</p>
</sec>
<sec id="s2_2">
<title>Clinical data analysis</title>
<p>We separated the total population into two independent cohorts. All patients from CHUM, JGH, and IUCPQ comprised the discovery cohort (<italic>n</italic> = 512 patients) while patients from CHUS comprised the validation cohort (<italic>n</italic> = 130 patients). Baseline demographic and clinicopathological characteristics were compared between the discovery and validation cohort using chi-square or Fisher&#x2019;s exact test for categorical variables and Student&#x2019;s <italic>t</italic>-test or Mann&#x2013;Whitney <italic>U</italic> test for continuous variables, as appropriate. Clinical outcome of PFS at 6 months was used as the stronger outcome marker for NSCLC patients amenable to ICIs as this clinical marker was found to be one of the most robust (<xref ref-type="bibr" rid="B3">3</xref>). All patients included had a PFS superior to 6 months or progressed before.</p>
</sec>
<sec id="s2_3">
<title>Harmonization process</title>
<sec id="s2_3_1">
<title>CT scan normalization</title>
<p>Each primary lesion was manually annotated by a radiation oncologist or a radiologist for identifying the tumor&#x2019;s longest axis, on de-identified, pretreatment CT images. The following pre-processing steps were applied to all scans: resampling to 1-mm isometric voxels (to normalize pixel and slice thickness variation) followed by Hounsfield Unit (HU) truncation to a range &#x2212;400 HU to 1,024 HU (to reduce the impact of artifacts on radiomics features), followed by image noise normalization using a Laplacian of Gaussian filter from the PyRadiomics library with hyperparameter values for sigma2 = {1,3} (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B23">23</xref>) (see <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>).</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Radiomics workflows used in the study. The upper panel represents PyRadiomics pipeline including, sequentially, the segmentation input and hand-engineered feature extractions. The lower panel represents the DeepRadiomics pipeline with weakly supervised region extractions and automated feature learning extractions.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1196414-g001.tif"/>
</fig>
</sec>
<sec id="s2_3_2">
<title>Radiomics feature extraction</title>
<sec id="s2_3_2_1">
<title>PyRadiomics features extraction</title>
<p>We used a three-stage process to determine the region of interest (ROI) used for extracting radiomic features. The first stage consisted of CT scan alignment achieved by principal component analysis (PCoA), followed by chest isolation through mathematical morphology-based denoising, and finally chest segmentation based on connected regions (<xref ref-type="bibr" rid="B24">24</xref>). In the second stage, the lung was automatically segmented based on the detected skin boundary, rough segmentation of lung contour, and pulmonary parenchyma refinement. Next, this lung segmentation was intersected with a clustering-based nodule mask to identify a nodule ROI agnostic of size, position, and spreading near or through the pleura, utilizing the relative symmetry of the lung (<xref ref-type="bibr" rid="B25">25</xref>). These ROIs were then assessed for clinical appropriateness in view of known shortcomings of segmentation techniques reported in the radiomics literature that extend beyond the objective of the current study but for which, nonetheless, we present an alternative in the form of a new DeepRadiomics method. From the segmentation, the PyRadiomics library v3.0.1, an open-source python package for the extraction of radiomics features from medical imaging, was used to extract 94 candidate radiomics features: 19 first-order features and 75 second-order features with a Laplacian of Gaussian (LoG) filter applied (<xref ref-type="bibr" rid="B26">26</xref>). The reproducibility of extracting PyRadiomics features from different segmentations has been well studied, and a high reproducibility was reported for first-order, Laplacian, Gaussian-filtered features and texture features, but low reproducibility for shape and wavelet features. Indeed, wavelet features were extracted but omitted from analyses due to the high association with the acquisition parameters.</p>
</sec>
<sec id="s2_3_2_2">
<title>DeepRadiomics features extraction</title>
<p>We proposed a new data-driven alternative to the traditional PyRadiomics method. We followed the emerging interest in deep learning models to provide suitable high-throughput extraction of quantitative imaging features from medical images (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B28">28</xref>). A VGG16 backbone was pre-trained to learn image features followed by a SimCLR process, a self-learning framework for contrastive learning of visual representations (<xref ref-type="bibr" rid="B29">29</xref>, <xref ref-type="bibr" rid="B30">30</xref>). The pre-training datasets consisted of the public dataset [Lung Image Database Consortium (LIDC)], after applying the CT scan normalization procedure described in this article (<xref ref-type="bibr" rid="B31">31</xref>), in order to leverage a larger dataset of lung CT scans also obtained across multiple institutions and acquisition parameters. The pretraining was made on 2D patches of 48 &#xd7; 48 pixels, centered on the nodules. For each image in a batch, we applied two different sets of data augmentation (random translation, rotation, flip, gaussian blur, and zoom), while training the model to correctly identify pairs of images representing the same nodule among other nodules in the same batch. In our proposed method, relevant images were processed using the pretrained SimCLR network, and automatically learned features were extracted from its last convolutional layer. Patch input could not be smaller than 32 &#xd7; 32 due to the model architecture backbone, so we expanded context as needed for ROIs smaller than this. Finally, the full ROI bounding box derived from the annotation process was used instead of segmenting or delineating potential lesions as is usually required in radiomics, which we see as further contributing to clinical generalization.</p>
</sec>
<sec id="s2_3_2_3">
<title>Toward the generalizability of AI models across healthcare settings</title>
<p>We designed a global hyperparameter search framework (the &#x201c;GHPS&#x201d;) to autonomously determine the final artificial intelligence (AI) model based on generalization-optimizing parameter configurations rather than performance-optimizing configurations. GHPS is ideally implemented by iteratively performing cross-center cross-validation testing over all combinations of parameters composed of the following four methods (<xref ref-type="bibr" rid="B32">32</xref>): (a) feature extraction, (b) feature selection, (c) model selection, and (d) model hyperparameter tuning. To reduce computational complexity, we elected to perform cross-validation testing, after processing all data with our normalization strategy, over all combinations of parameters consisting of (i) feature selection, (ii) model selection, and (iii) model hyperparameter tuning. Finally, our cross-validation testing allowed for refining the estimated final model with the best average performance remaining within small cross-center variability in performance, thus ensuring optimal generalizability.</p>
<p>We used a Sobol sequence for the randomized hyperparameter search to construct low discrepancy sets (<xref ref-type="bibr" rid="B33">33</xref>). The feature selection space was optimized for removing highly correlated features using a Spearman rho method with thresholds ranging from 0.8 to 1, as well as evaluating the optimal feature reduction method from among (a) <italic>F</italic>-test, (b) three relief-based algorithms from the open-source library ReBATE (<xref ref-type="bibr" rid="B34">34</xref>), or (c) a custom implementation of the Maximum Relevance &#x2212; Minimum Redundancy strategy (<xref ref-type="bibr" rid="B35">35</xref>). Model selection space was optimized for identifying non-overfitting methods on our datasets (across folds) from logistic regression and XGboost, and then defining the optimal parametrization of such, considering (a) a metric of calibration with Nagekjerje&#x2019;s R index (average), (b) metrics of discrimination with the area under the curve (AUC), and (c) a metric of goodness of fit with the Brier&#x2019;s score; altogether, the agreement of these metrics is chosen as a proxy for generalizability due to their ability to capture (correlate with) the variance of the AUC (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>). Moreover, we extended this observation by measuring the Youden&#x2019;s <italic>J</italic> statistics from both the discovery and validation models where the Clinical + DeepRadiomics model had a superior Youden score compared to Clinical + PD-L1 or Clinical + PyRadiomics, informing on the probability of a model to support an informed decision as opposed to a random guess, taking into account all model predictions (<xref ref-type="supplementary-material" rid="SM2">
<bold>Supplementary Table&#xa0;2</bold>
</xref>).</p>
<p>The model with both best average and smallest variability in performance across folds was selected as the final model. The hyperparameter tuning space of the &#x201c;selected model&#x201d; was optimized for discovering the final 5 to 20 features best representing the complete information space (at each fold), inclusive of a set of 5 fixed features comprising lesion radius, ECOG score, age, smoking history (never/former/current), and first-line ICI (yes/no), with and without including PD-L1 status. In that manner, imaging features would only be identified in case of complementing clinically relevant features as per our primary objective.</p>
<p>We used the bootstrap 95% confidence interval of the model performance in the discovery cohort for establishing a judgment of generalizability to the validation cohort (<xref ref-type="bibr" rid="B36">36</xref>). We determined the success of a biomarker&#x2019;s generalizability test when its estimate of the AUC derived from the validation cohort fell within the confidence interval of estimate of the AUC derived from the discovery cohort.</p>
</sec>
</sec>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Cohort description</title>
<p>This study included a total of 910 eligible patients from four institutions. A first selection was made on availability of imaging within 3 months prior to initiation of ICI therapy, which resulted in the exclusion of 147 patients. Then, we excluded 121 patients for which a primary lesion could not be clearly delineated in the annotation process, to reach a final population of 642 patients (<xref ref-type="supplementary-material" rid="SF1">
<bold>Supplementary Figure&#xa0;1</bold>
</xref>). A total of 512 patients from the discovery cohort had a median PFS of 5.5 months (95% CI [4.8&#x2013;6.7]) and 130 patients from the validation cohort had a median PFS of 6.1 months (95% CI [5.1&#x2013;7.5]) (<italic>p</italic> = 0.377). There were no statistical differences between the discovery and validation cohorts regarding the mean age, sex proportion, history of smoking, distribution of ECOG status, stage, or distribution of the PD-L1 group (all <italic>p</italic> &gt; 0.05) (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). However, a larger proportion of patients in the validation cohort received ICI as first-line therapy (72%) compared to the discovery cohort (39%) (<italic>p</italic> &lt; 0.001) (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). With respect to outcome, the proportion of patients in discovery and validation cohorts with PFS at 6 months were 51% and 46%, respectively (<italic>p</italic> = 0.377).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Baseline characteristics of 642 patients segregated into the discovery and validation cohorts.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left"/>
<th valign="top" align="center">Discovery cohort<break/>n=512</th>
<th valign="top" align="center">Validation cohort<break/>n=130</th>
<th valign="top" align="center">
<italic>p-value</italic>
</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Age - median [IQR]</td>
<td valign="top" align="center">68.3 [62.3, 73.8]</td>
<td valign="top" align="center">67.1 [60.5, 72.8]</td>
<td valign="top" align="center">
<italic>0.232</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">
<bold>Sex</bold> - n (%)<break/>&#x2003;Male<break/>&#x2003;Female</td>
<td valign="top" align="center">&#xa0;<break/>258 (51)<break/>254 (49)</td>
<td valign="top" align="center">&#xa0;<break/>69 (53)<break/>61 (47)</td>
<td valign="top" align="center">
<italic>&#xa0;</italic>
<break/>
<italic>0.653</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">
<bold>Smoking history</bold> - n (%)<break/>&#x2003;Current or former<break/>&#x2003;Never</td>
<td valign="top" align="center">&#xa0;<break/>466 (92)<break/>46 (8)</td>
<td valign="top" align="center">&#xa0;<break/>125 (97)<break/>5 (3)</td>
<td valign="top" align="center">
<italic>&#xa0;</italic>
<break/>
<italic>0.067</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">
<bold>ECOG status</bold> - n (%)<break/>&#x2003;0<break/>&#x2003;1<break/>&#x2003;&gt;2</td>
<td valign="top" align="center">&#xa0;<break/>137 (27)<break/>292 (59)<break/>68 (14)</td>
<td valign="top" align="center">&#xa0;<break/>37 (29)<break/>77 (59)<break/>16 (12)</td>
<td valign="top" align="center">
<italic>&#xa0;</italic>
<break/>
<italic>0.514</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">
<bold>Stage</bold> - n (%)<break/>&#x2003;III<break/>&#x2003;IV</td>
<td valign="top" align="center">&#xa0;<break/>52 (10)<break/>460 (90)</td>
<td valign="top" align="center">&#xa0;<break/>11 (8)<break/>119 (92)</td>
<td valign="top" align="center">
<italic>&#xa0;</italic>
<break/>
<italic>0.642</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">
<bold>Histology</bold> - n (%)<break/>&#x2003;Adenocarcinoma<break/>&#x2003;Squamous<break/>&#x2003;Other</td>
<td valign="top" align="center">&#xa0;<break/>404 (79)<break/>29 (6)<break/>79 (15)</td>
<td valign="top" align="center">&#xa0;<break/>89 (69)<break/>13 (10)<break/>28 (21)</td>
<td valign="top" align="center">
<italic>&#xa0;</italic>
<break/>
<italic>0.034</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">
<bold>PD-L1 status</bold> - n (%)<break/>&#x2003;&lt;1%<break/>&#x2003;1-49%<break/>&#x2003;&#x2265;50%</td>
<td valign="top" align="center">&#xa0;<break/>97 (22)<break/>117 (27)<break/>223 (51)</td>
<td valign="top" align="center">&#xa0;<break/>36 (29.0)<break/>34 (27.4)<break/>54 (43.5)</td>
<td valign="top" align="center">
<italic>&#xa0;</italic>
<break/>
<italic>0.222</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">
<bold>Line of treatment</bold> - n (%)<break/>&#x2003;First line<break/>&#x2003;Second line or more</td>
<td valign="top" align="center">&#xa0;<break/>197 (39)<break/>315 (61)</td>
<td valign="top" align="center">&#xa0;<break/>94 (72)<break/>36 (28)</td>
<td valign="top" align="center">
<italic>&#xa0;</italic>
<break/>
<italic>&lt;0.001</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">
<bold>Type of treatment</bold> - n (%)<break/>&#x2003;ICI alone<break/>&#x2003;Chemotherapy-ICI</td>
<td valign="top" align="center">&#xa0;<break/>469 (91)<break/>43 (9)</td>
<td valign="top" align="center">&#xa0;<break/>76 (59)<break/>54 (41)</td>
<td valign="top" align="center">
<italic>&#xa0;</italic>
<break/>
<italic>&lt;0.001</italic>
</td>
</tr>
<tr>
<td valign="top" align="left">
<bold>Progression-free survival</bold> - n (%)<break/>&#x2003;&#x2265; 6 months<break/>&#x2003;&lt; 6 months</td>
<td valign="top" align="center">&#xa0;<break/>260 (51)<break/>252 (49)</td>
<td valign="top" align="center">&#xa0;<break/>60 (46)<break/>70 (54)</td>
<td valign="top" align="center">
<italic>&#xa0;</italic>
<break/>
<italic>0.377</italic>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Italic terms define the p-value.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_2">
<title>Benchmark of clinical outcome prediction with standard clinicopathological features</title>
<p>First, we sought to define the role of standard-of-care prognostic score using only clinical variables (age, ECOG status, smoking status, and line of treatment) alone or in combination with PD-L1 expression to establish a benchmark for clinical outcome prediction. The best clinical prognostic factor for PFS-6 was obtained with the combination of Clinical + PD-L1 expression with an AUC of 0.66 (95% CI [0.61&#x2013;0.70]) in the discovery cohort and 0.62 (95% CI [0.53&#x2013;0.72]) in the validation cohort (<xref ref-type="supplementary-material" rid="SF2">
<bold>Supplementary Figures&#xa0;2A, D</bold>
</xref>). Clinical markers alone did not perform as well with an AUC of 0.64 (95% CI [0.59&#x2013;0.69]) and 0.58 (95% CI [0.49&#x2013;0.69]) in the discovery and validation cohort, respectively. Similarly, the AUC of the model with PD-L1 expression alone was 0.56 (95% CI [0.52&#x2013;0.61]) in the discovery cohort and 0.59 (95% CI [0.48&#x2013;0.70]) in the validation cohort (<xref ref-type="supplementary-material" rid="SF2">
<bold>Supplementary Figures&#xa0;2B, C, E, F</bold>
</xref>).</p>
</sec>
<sec id="s3_3">
<title>Radiomics prediction without harmonization</title>
<p>Subsequently, we measured the predictive role of radiomics with no harmonization. We used PCoA to facilitate the projection and visualization of high-dimensional radiomic feature data. Before data harmonization, using PyRadiomic features, we observed clustering by CT scan slice thickness, manufacturer, kernel, and academic centers (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>). PCoA obtained from DeepRadiomics revealed similar clustering effect across the different medical centers, CT vendors, reconstruction kernels, and slice thicknesses (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>). These clusters were expected based on the important difference in CT acquisition parameters from each center (<xref ref-type="supplementary-material" rid="SM3">
<bold>Supplementary Table&#xa0;3</bold>
</xref>). Without CT harmonization, a model combining Clinical + PyRadiomics or DeepRadiomics features to predict PFS-6 featured had an AUC of 0.69 (95% CI [0.64&#x2013;0.74]) and 0.69 (95% CI [0.64&#x2013;0.74]), respectively, in the discovery cohort (<xref ref-type="supplementary-material" rid="SF3">
<bold>Supplementary Figure&#xa0;3A</bold>
</xref>). Nevertheless, AUC in the validation cohorts did not generalize; the AUC was 0.57 for Clinical + PyRadiomics and 0.52 for Clinical + DeepRadiomics both outside their respected interval CI obtained in the discovery cohorts (<xref ref-type="supplementary-material" rid="SF3">
<bold>Supplementary Figure&#xa0;3B</bold>
</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>
<bold>(A)</bold> Principal component analysis (PCoA) of PyRadiomics representation of various CT-scan acquisition parameters (Slide thickness, Manufacturer, Kernel, and Site) prior to image harmonization. <bold>(B)</bold> PCoA of PyRadiomics representation of various CT-scan acquisition parameters (Slide thickness, Manufacturer, Kernel, and Site) after image harmonization. PyRad, PyRadiomics.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1196414-g002.tif"/>
</fig>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>
<bold>(A)</bold> Principal component analysis (PCoA) of DeepRadiomics representation of various CT-scan acquisition parameters (Slide thickness, Manufacturer, Kernel, and Site) prior to image harmonization. <bold>(B)</bold> PCoA of DeepRadiomics representation of various CT-scan acquisition parameters (Slide thickness, Manufacturer, Kernel, and Site) after image harmonization. DeepRad, DeepRadiomics.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1196414-g003.tif"/>
</fig>
<p>Next, we aimed to include PD-L1 to these models to improve generalizability. First, PD-L1 did not increase the AUC in the discovery cohorts for both radiomic signatures with AUC reaching 0.71 compared to 0.69 without PD-L1 (<xref ref-type="supplementary-material" rid="SF3">
<bold>Supplementary Figure&#xa0;3C</bold>
</xref>). Second, the addition of PD-L1 did not support the generalizability of performances in the validation cohorts (<xref ref-type="supplementary-material" rid="SF3">
<bold>Supplementary Figure&#xa0;3D</bold>
</xref>).</p>
</sec>
<sec id="s3_4">
<title>Image processing-based harmonization of radiomics features</title>
<p>Following the normalization of raw CT scans data detailed in the &#x201c;CT scan normalization&#x201d; section, and processing first for PyRadiomics, we obtained a relatively homogeneous population for the clusters of slice thickness, manufacturer, and site (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). Despite improvement in kernel distribution on the PCoA, visual clustering was still observed.</p>
<p>Next, the same normalization method alongside DeepRadiomics revealed a broad homogenization across the four parameters of interest including kernel (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>). Of note, we observed, after normalization, two populations across all PCoA. After further investigation, we confirmed that these populations were a result of the patch size of 48 &#xd7; 48 pixels used during pretraining of the VGG16 backbone introduced in the &#x201c;DeepRadiomics features extraction&#x201d; section (<xref ref-type="supplementary-material" rid="SF4">
<bold>Supplementary Figure&#xa0;4A</bold>
</xref>). To assess if the radius clusters were confounders for PFS-6 months, we represented a PCoA for DeepRadiomics features vs. PFS-6 months (<xref ref-type="supplementary-material" rid="SF4">
<bold>Supplementary Figure&#xa0;4B</bold>
</xref>). We observed that there was no association of radius cluster with PFS-6 months. Our results showed that, after normalization, we were able to mitigate for variation across medical centers, CT vendors, acquisition variability, and reconstruction kernels.</p>
</sec>
<sec id="s3_5">
<title>Performance of AI-based radiomics signature designed for generalizability</title>
<p>Having laid out the foundation to construct a radiomic signature across centers, we sought to implement a global hyperparameter search framework (the &#x201c;GHPS&#x201d;) to determine the optimal combination of machine learning and imaging features to establish a final radiomics biomarker to predict PFS-6.</p>
<p>First, using this construct, the combination of Clinical + PyRadiomics depicted an AUC of 0.66 (95% CI [0.61&#x2013;0.70]) and 0.59 (95% CI [0.49&#x2013;0.68]) in the discovery and validation cohorts, respectively, failing to meet the validation criteria for reproducibility (remaining within the discovery CI), <italic>de facto</italic> failing the generalizability objective (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4A, B</bold>
</xref>).</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Receiver operating characteristic (ROC) curves for PFS-6 months prediction models with <bold>(A)</bold> Clinical (age, ECOG status, smoking status, and line of treatment) + PyRadiomics after harmonization, <bold>(B)</bold> Clinical + DeepRadiomics after harmonization in the discovery cohorts, <bold>(C)</bold> Clinical + PyRadiomics after harmonization, and <bold>(D)</bold> Clinical+ DeepRadiomics after harmonization in the validation cohorts. PyRad, PyRadiomics; DeepRad, DeepRadiomics.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-13-1196414-g004.tif"/>
</fig>
<p>Second, the combination of Clinical + DeepRadiomics features reached an AUC of 0.67 (95% CI [0.63&#x2013;0.73]) and 0.63 (95% CI [0.53&#x2013;0.73]) in the discovery and validation cohort, respectively (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4C, D</bold>
</xref>). The validation cohort AUC of 0.63 also fell within its 95% CI estimate in the discovery cohort, meeting our generalizable objective. Interestingly, these results were comparable to Clinical + PD-L1 currently used in routine oncology practice. Moreover, both models also depicted a lower bound on the 95% CI of these models that was greater than 0.50 in the discovery cohort, confirming the predictive value of these models. Third, using both models, the addition of PD-L1 did not increase the performances (similar AUC) or the generalizability (<xref ref-type="supplementary-material" rid="SF5">
<bold>Supplementary Figures&#xa0;5A&#x2013;D</bold>
</xref>).</p>
<p>Finally, to provide valuable insights for future research to be leveraged as part of prior information for statistical study design, we conducted an exploratory assessment of non-inferiority using permutation analyses. Indeed, it is important to note that our study was not specifically designed or adequately powered for standard non-inferiority testing. Nonetheless, our findings indicate that the AUC of the Clinical + DeepRadiomics model was not statistically lower than the AUC of the Clinical + PD-L1 model (mean difference across permutations: 0.00035; <italic>p</italic>-value: 0.617<italic>).</italic>
</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>Radiomics represent a promising non-invasive biomarker for patients amenable to ICI; however, generalizability especially in various centers represent the major limitation (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B19">19</xref>). In this large study of advanced NSCLC treated with ICI across four institutions, we demonstrated that a risk prediction model that combined Clinical + DeepRadiomics was generalizable and was non-inferior to the Clinical + PD-L1 model currently used by oncologists to predict PFS-6 months.</p>
<p>Importantly, our results showed that, after generalizability, DeepRadiomics methods had a better performance than the PyRadiomics pipeline. This could be explained by our proposed combination of traditional harmonization techniques, which, together with a generalization-optimizing AI framework, overcomes these limitations of previous models that did not generalize and enables clinical utility. Our AI framework involves two automated steps: the discovery of relevant imaging features using DeepRadiomics that delivers informative, reproducible, and stable compressed representation of an imaging data space, and a global hyperparameter search that iteratively loops over all combination of the three methods used in our modeling process: (a) feature selection that chooses the best algorithm that identifies features to include in the model, maintaining the most &#x201c;informative&#x201d; features, and removing noisy &#x201c;non-informative,&#x201d; irrelevant and redundant features; (b) model selection that determines which machine learning estimator to use; and (c) hyperparameter tuning, which defines the optimum hyperparameter values to use for each estimator. While computationally intensive, this global search allows for the data-driven exploration of the somewhat unpredictable interplay between models and features (<xref ref-type="bibr" rid="B23">23</xref>). Consequently, we avoided radiomics features that were independently selected from other factors and/or not solely derived from the training portion of the data (in the machine learning training&#x2013;validation&#x2013;test sense), typically subject to an often-overlooked look-ahead bias and loss of future generalizability, addressing the problem of inappropriately applying cross-validation methods to feature selection (<xref ref-type="bibr" rid="B37">37</xref>).</p>
<p>However, the addition to our signature combining DeepRadiomics + Clinical was not improved by the implementation of a third parameter such as PD-L1. This could be explained by the limited discovery dataset available in this trial, which would otherwise be necessary to increase model parameters with sufficient examples for machine learning. Altogether, we obtained strong AUC in the discovery cohort independent of PD-L1 expression; however, there was no evidence of generalizability in the validation cohorts. This observation confirms that in the absence of homogeneous PCoA, radiomics validation is limited.</p>
<p>Furthermore, we acknowledge limitations in this study. First, although the CT scans were obtained from four institutions, only two physicians (a radiation oncologist and a radiologist) performed the image segmentations, reducing inter-observer variabilities. Second, the use of PyRadiomics is limited by the radiomic features being extracted from segmented ROI that required at least some degree of direct planimetry (and therefore additional physician time), subject to inter-annotator variability (<xref ref-type="bibr" rid="B38">38</xref>). This limitation was not present for the DeepRadiomics method we proposed, which does not require a segmentation input. Third, the validation cohort baseline characteristics had more patients treated with first line, which could decrease the performance of our model. Indeed, prior chemotherapy could impact the image features. Also, combination treatment such as chemotherapy with immunotherapy could modify the reproducibility of our model. Nevertheless, the DeepRadiomics method and the AI generalizability framework were able to mitigate this challenge. Lastly, with a primary objective to assess model generalizability, we eventually lacked the power to undertake non-inferiority testing. Our current results would indeed motivate further investigation in that direction, on another larger cohort of patients.</p>
<p>In conclusion, this radiomics generalizability study was able to demonstrate that a DeepRadiomics signature with harmonization developed in a discovery cohort from various centers could overcome the negative impact of variable CT acquisition parameters and then could be validated in an independent cohort. This DeepRadiomics harmonization signature warrants further improvement and validation in external cohorts of patients with NSCLC treated with ICI and opens a new non-invasive biomarker strategy.</p>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s6" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving human participants were reviewed and approved by MP-02-2019-8091. The patients/participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>MT annotated CT-scans, collected clinical data, and wrote and reviewed the manuscript. Imagia team (KP, CL-K, FD, LJ, FR, KK, DH, and FIC) completed statistical analysis, normalization, and radiomics features extraction. SK and JP collected clinical data. FrC annotated CT-scans. VM, DV JM, FIC, AG, WB, AE, MO, NB, TM, DH, PJ, and KP reviewed the manuscript. BR coordinated the project and reviewed the manuscript.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>This work was supported by the Oncopole, the MEDTEQ Consortium, the TransMedTech Institute, and the Cancer Research Society, as part of the joint Onco-Tech Competition (BR, PJ, and Imagia), Marathon of Hope Montreal Cancer Consortium (BR), Institut du Cancer de Montr&#xe9;al NSCLC Biobank (BR), Terry Fox Clinician Scientist award (BR), Nuovo-Soldati Foundation for Cancer Research (MT), Bourse Maurice-Tubiana (MT), and Fonds de Recherche du Qu&#xe9;bec FRQS (BR and PJ). VM holds a salary support award from the Fonds de recherche du Qu&#xe9;bec &#x2013; Sant&#xe9; (FRQS: Quebec Foundation for Health Research). This project was supported by the FRQS, a start-up fund from the Quebec Heart &amp; Lung Institute Research Center, along with the Foundation grant from the Quebec Heart &amp; Lung Institute Research Center.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We thank the Quebec Respiratory Health Research Network-IUCPQ site Biobank for providing clinical data and tissue from the IUCPQ cohort.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>Author BR reports research funding with the company Imagia. Authors KP, CL-K, FD, LJ, FR, KK, DH, and FIC were Imagia employees at the time of the study.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fonc.2023.1196414/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fonc.2023.1196414/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Image_1.jpeg" id="SF1" mimetype="image/jpeg">
<label>Supplementary Figure&#xa0;1</label>
<caption>
<p>Flow chart diagram of exclusion and final studied cohorts.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image_2.jpeg" id="SF2" mimetype="image/jpeg">
<label>Supplementary Figure&#xa0;2</label>
<caption>
<p>Receiver operating characteristic (ROC) curves for the prediction models without radiomics and only with <bold>(A)</bold> clinical (age, ECOG status, smoking status, and line of treatment) + immunohistochemistry PD-L1 tumor expression, <bold>(B)</bold> representing clinical alone and <bold>(C)</bold> immunohistochemistry PD-L1 tumor expression in the discovery and <bold>(D-F)</bold> validation cohorts.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image_3.jpeg" id="SF3" mimetype="image/jpeg">
<label>Supplementary Figure&#xa0;3</label>
<caption>
<p>
<bold>(A)</bold> Receiver operating characteristic (ROC) curves for the prediction models with, clinical (age, ECOG status, smoking status, and line of treatment) + PyRadiomics before harmonization or clinical + DeepRadiomics before harmonization in the discovery cohorts <bold>(B)</bold> ROC curves of clinical + PyRadiomics before harmonization and clinical + DeepRadiomics before harmonization in the validation cohorts. <bold>(C,D)</bold> similar ROC curves but with the addiction of PD-L1 for the discovery and validation cohorts respectively.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image_4.jpeg" id="SF4" mimetype="image/jpeg">
<label>Supplementary Figure&#xa0;4</label>
<caption>
<p>
<bold>(A)</bold> Principal component analysis (PCoA) of DeepRadiomics features after normalization depicted by the VGG16 backbone network input of 24 pixels <bold>(B)</bold> PCoA of DeepRadiomics features stratified by outcome PFS-6 months.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image_5.jpeg" id="SF5" mimetype="image/jpeg">
<label>Supplementary Figure&#xa0;5</label>
<caption>
<p>Receiver operating characteristic (ROC) curves for PFS-6 months prediction models with <bold>(A)</bold> Clinical (age, ECOG status, smoking status, and line of treatment) + PyRadiomics + PD-L1 after harmonization in the discovery cohort <bold>(B)</bold> Clinical + PyRadiomics + PD-L1 after harmonization in the validation cohort and <bold>(C)</bold> clinical + DeepRadiomics + PD-L1 after harmonization in the discovery cohort <bold>(D)</bold> clinical + DeepRadiomics + PD-L1 after harmonization in the validation cohort. PyRad, PyRadiomics; DeepRad, DeepRadiomics.</p>
</caption>
</supplementary-material>
  <supplementary-material xlink:href="Table_1.pdf" id="SM1" mimetype="application/pdf">
<label>Supplementary Table&#xa0;1</label>
<caption>
<p>&#x2013; Generalizability of the performance of the prediction models using Nagelkerke&#x2019;s R, Bier&#x2019;s score and area under the curve (AUC) as measures of AI-model calibration.</p>
</caption>
</supplementary-material>
  <supplementary-material xlink:href="Table_2.pdf" id="SM2" mimetype="application/pdf">
<label>Supplementary Table&#xa0;2</label>
<caption>
<p>&#x2013; Determination of the Sensitivity and Specificity of the Model in discovery and validation cohorts using the Yonden&#x2019;s index.</p>
</caption>
</supplementary-material>
  <supplementary-material xlink:href="Table_3.pdf" id="SM3" mimetype="application/pdf">
<label>Supplementary Table&#xa0;3</label>
<caption>
<p>- Baseline characteristics of computed tomography scan characteristics in the discovery and validation cohorts.</p>
</caption>
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gillies</surname> <given-names>RJ</given-names>
</name>
<name>
<surname>Kinahan</surname> <given-names>PE</given-names>
</name>
<name>
<surname>Hricak</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Radiomics: images are more than pictures, they are data</article-title>. <source>Radiology</source> (<year>2016</year>) <volume>278</volume>(<issue>2</issue>):<page-range>563&#x2013;77</page-range>. doi: <pub-id pub-id-type="doi">10.1148/radiol.2015151169</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gandhi</surname> <given-names>L</given-names>
</name>
<name>
<surname>Rodr&#xed;guez-Abreu</surname> <given-names>D</given-names>
</name>
<name>
<surname>Gadgeel</surname> <given-names>S</given-names>
</name>
<name>
<surname>Esteban</surname> <given-names>E</given-names>
</name>
<name>
<surname>Felip</surname> <given-names>E</given-names>
</name>
<name>
<surname>De Angelis</surname> <given-names>F</given-names>
</name>
<etal/>
</person-group>. <article-title>Pembrolizumab plus chemotherapy in metastatic non-Small-Cell lung cancer</article-title>. <source>N Engl J Med</source> (<year>2018</year>) <volume>378</volume>(<issue>22</issue>):<page-range>2078&#x2013;92</page-range>. doi: <pub-id pub-id-type="doi">10.1056/NEJMoa1801005</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hellmann</surname> <given-names>MD</given-names>
</name>
<name>
<surname>Paz-Ares</surname> <given-names>L</given-names>
</name>
<name>
<surname>Bernabe Caro</surname> <given-names>R</given-names>
</name>
<name>
<surname>Zurawski</surname> <given-names>B</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>SW</given-names>
</name>
<name>
<surname>Carcereny Costa</surname> <given-names>E</given-names>
</name>
<etal/>
</person-group>. <article-title>Nivolumab plus ipilimumab in advanced non-Small-Cell lung cancer</article-title>. <source>N Engl J Med</source> (<year>2019</year>) <volume>381</volume>(<issue>21</issue>):<page-range>2020&#x2013;31</page-range>. doi: <pub-id pub-id-type="doi">10.1056/NEJMoa1910231</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>HS</given-names>
</name>
<name>
<surname>Cha</surname> <given-names>H</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>J</given-names>
</name>
<name>
<surname>Park</surname> <given-names>WY</given-names>
</name>
<name>
<surname>Choi</surname> <given-names>YL</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>JM</given-names>
</name>
<etal/>
</person-group>. <article-title>Genomic scoring to determine clinical benefit of immunotherapy by targeted sequencing</article-title>. <source>Eur J Cancer</source> (<year>2019</year>) <volume>120</volume>:<fpage>65</fpage>&#x2013;<lpage>74</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ejca.2019.08.001</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reck</surname> <given-names>M</given-names>
</name>
<name>
<surname>Rodr&#xed;guez-Abreu</surname> <given-names>D</given-names>
</name>
<name>
<surname>Robinson</surname> <given-names>AG</given-names>
</name>
<name>
<surname>Hui</surname> <given-names>R</given-names>
</name>
<name>
<surname>Cs&#x151;szi</surname> <given-names>T</given-names>
</name>
<name>
<surname>F&#xfc;l&#xf6;p</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Five-year outcomes with pembrolizumab versus chemotherapy for metastatic non-Small-Cell lung cancer with PD-L1 tumor proportion score &#x2265; 50</article-title>. <source>J Clin Oncol</source> (<year>2021</year>) <volume>39</volume>(<issue>21</issue>):<page-range>2339&#x2013;49</page-range>. doi: <pub-id pub-id-type="doi">10.1200/JCO.21.00174</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gadgeel</surname> <given-names>S</given-names>
</name>
<name>
<surname>Rodr&#xed;guez-Abreu</surname> <given-names>D</given-names>
</name>
<name>
<surname>Speranza</surname> <given-names>G</given-names>
</name>
<name>
<surname>Esteban</surname> <given-names>E</given-names>
</name>
<name>
<surname>Felip</surname> <given-names>E</given-names>
</name>
<name>
<surname>D&#xf3;mine</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Updated analysis from KEYNOTE-189: pembrolizumab or placebo plus pemetrexed and platinum for previously untreated metastatic nonsquamous non-Small-Cell lung cancer</article-title>. <source>J Clin Oncol</source> (<year>2020</year>) <volume>38</volume>(<issue>14</issue>):<page-range>1505&#x2013;17</page-range>. doi: <pub-id pub-id-type="doi">10.1200/JCO.19.03136</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rodr&#xed;guez-Abreu</surname> <given-names>D</given-names>
</name>
<name>
<surname>Powell</surname> <given-names>SF</given-names>
</name>
<name>
<surname>Hochmair</surname> <given-names>MJ</given-names>
</name>
<name>
<surname>Gadgeel</surname> <given-names>S</given-names>
</name>
<name>
<surname>Esteban</surname> <given-names>E</given-names>
</name>
<name>
<surname>Felip</surname> <given-names>E</given-names>
</name>
<etal/>
</person-group>. <article-title>Pemetrexed plus platinum with or without pembrolizumab in patients with previously untreated metastatic nonsquamous NSCLC: protocol-specified final analysis from KEYNOTE-189</article-title>. <source>Ann Oncol</source> (<year>2021</year>) <volume>32</volume>(<issue>7</issue>):<page-range>881&#x2013;95</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.annonc.2021.04.008</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rizvi</surname> <given-names>H</given-names>
</name>
<name>
<surname>Sanchez-Vega</surname> <given-names>F</given-names>
</name>
<name>
<surname>La</surname> <given-names>K</given-names>
</name>
<name>
<surname>Chatila</surname> <given-names>W</given-names>
</name>
<name>
<surname>Jonsson</surname> <given-names>P</given-names>
</name>
<name>
<surname>Halpenny</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>Molecular determinants of response to anti-programmed cell death (PD)-1 and anti-programmed death-ligand 1 (PD-L1) blockade in patients with non-Small-Cell lung cancer profiled with targeted next-generation sequencing</article-title>. <source>J Clin Oncol</source> (<year>2018</year>) <volume>36</volume>(<issue>7</issue>):<page-range>633&#x2013;41</page-range>. doi: <pub-id pub-id-type="doi">10.1200/JCO.2017.75.3384</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Limkin</surname> <given-names>EJ</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>R</given-names>
</name>
<name>
<surname>Dercle</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zacharaki</surname> <given-names>EI</given-names>
</name>
<name>
<surname>Robert</surname> <given-names>C</given-names>
</name>
<name>
<surname>Reuz&#xe9;</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Promises and challenges for the implementation of computational medical imaging (radiomics) in oncology</article-title>. <source>Ann Oncol</source> (<year>2017</year>) <volume>28</volume>(<issue>6</issue>):<page-range>1191&#x2013;206</page-range>. doi: <pub-id pub-id-type="doi">10.1093/annonc/mdx034</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>R</given-names>
</name>
<name>
<surname>Limkin</surname> <given-names>EJ</given-names>
</name>
<name>
<surname>Vakalopoulou</surname> <given-names>M</given-names>
</name>
<name>
<surname>Dercle</surname> <given-names>L</given-names>
</name>
<name>
<surname>Champiat</surname> <given-names>S</given-names>
</name>
<name>
<surname>Han</surname> <given-names>SR</given-names>
</name>
<etal/>
</person-group>. <article-title>A radiomics approach to assess tumour-infiltrating CD8 cells and response to anti-PD-1 or anti-PD-L1 immunotherapy: an imaging biomarker, retrospective multicohort study</article-title>. <source>Lancet Oncol</source> (<year>2018</year>) <volume>19</volume>(<issue>9</issue>):<page-range>1180&#x2013;91</page-range>. doi: <pub-id pub-id-type="doi">10.1016/S1470-2045(18)30413-3</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Castello</surname> <given-names>A</given-names>
</name>
<name>
<surname>Castellani</surname> <given-names>M</given-names>
</name>
<name>
<surname>Florimonte</surname> <given-names>L</given-names>
</name>
<name>
<surname>Urso</surname> <given-names>L</given-names>
</name>
<name>
<surname>Mansi</surname> <given-names>L</given-names>
</name>
<name>
<surname>Lopci</surname> <given-names>E</given-names>
</name>
</person-group>. <article-title>The role of radiomics in the era of immune checkpoint inhibitors: a new protagonist in the jungle of response criteria</article-title>. <source>J Clin Med</source> (<year>2022</year>) <volume>11</volume>(<issue>6</issue>):<fpage>1740</fpage>. doi: <pub-id pub-id-type="doi">10.3390/jcm11061740</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>R</given-names>
</name>
<name>
<surname>Henry</surname> <given-names>T</given-names>
</name>
<name>
<surname>Laville</surname> <given-names>A</given-names>
</name>
<name>
<surname>Carr&#xe9;</surname> <given-names>A</given-names>
</name>
<name>
<surname>Hamaoui</surname> <given-names>A</given-names>
</name>
<name>
<surname>Bockel</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Imaging approaches and radiomics: toward a new era of ultraprecision radioimmunotherapy</article-title>? <source>J Immunother Cancer</source> (<year>2022</year>) <volume>10</volume>(<issue>7</issue>):<elocation-id>e004848</elocation-id>. doi: <pub-id pub-id-type="doi">10.1136/jitc-2022-004848</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vanguri</surname> <given-names>RS</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>J</given-names>
</name>
<name>
<surname>Aukerman</surname> <given-names>AT</given-names>
</name>
<name>
<surname>Egger</surname> <given-names>JV</given-names>
</name>
<name>
<surname>Fong</surname> <given-names>CJ</given-names>
</name>
<name>
<surname>Horvat</surname> <given-names>N</given-names>
</name>
<etal/>
</person-group>. <article-title>Multimodal integration of radiology, pathology and genomics for prediction of response to PD-(L)1 blockade in patients with non-small cell lung cancer</article-title>. <source>Nat Cancer</source> (<year>2022</year>) <volume>13</volume>:<fpage>1</fpage>&#x2013;<lpage>14</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s43018-022-00416-8</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aerts</surname> <given-names>HJWL</given-names>
</name>
<name>
<surname>Velazquez</surname> <given-names>ER</given-names>
</name>
<name>
<surname>Leijenaar</surname> <given-names>RTH</given-names>
</name>
<name>
<surname>Parmar</surname> <given-names>C</given-names>
</name>
<name>
<surname>Grossmann</surname> <given-names>P</given-names>
</name>
<name>
<surname>Carvalho</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Decoding tumour phenotype by noninvasive imaging using a quantitative radiomics approach</article-title>. <source>Nat Commun</source> (<year>2014</year>) <volume>5</volume>:<fpage>4006</fpage>. doi: <pub-id pub-id-type="doi">10.1038/ncomms5006</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ibrahim</surname> <given-names>A</given-names>
</name>
<name>
<surname>Primakov</surname> <given-names>S</given-names>
</name>
<name>
<surname>Beuque</surname> <given-names>M</given-names>
</name>
<name>
<surname>Woodruff</surname> <given-names>HC</given-names>
</name>
<name>
<surname>Halilaj</surname> <given-names>I</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>Radiomics for precision medicine: current challenges, future prospects, and the proposal of a new framework</article-title>. <source>Methods</source> (<year>2021</year>) <volume>188</volume>:<page-range>20&#x2013;9</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.ymeth.2020.05.022</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname> <given-names>L</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>C</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>C</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
</person-group>. <article-title>Effects of contrast-enhancement, reconstruction slice thickness and convolution kernel on the diagnostic performance of radiomics signature in solitary pulmonary nodule</article-title>. <source>Sci Rep</source> (<year>2016</year>) <volume>6</volume>:<fpage>34921</fpage>. doi: <pub-id pub-id-type="doi">10.1038/srep34921</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Berenguer</surname> <given-names>R</given-names>
</name>
<name>
<surname>Pastor-Juan</surname> <given-names>MDR</given-names>
</name>
<name>
<surname>Canales-V&#xe1;zquez</surname> <given-names>J</given-names>
</name>
<name>
<surname>Castro-Garc&#xed;a</surname> <given-names>M</given-names>
</name>
<name>
<surname>Villas</surname> <given-names>MV</given-names>
</name>
<name>
<surname>Mansilla Legorburo</surname> <given-names>F</given-names>
</name>
<etal/>
</person-group>. <article-title>Radiomics of CT features may be nonreproducible and redundant: influence of CT acquisition parameters</article-title>. <source>Radiology</source> (<year>2018</year>) <volume>288</volume>(<issue>2</issue>):<page-range>407&#x2013;15</page-range>. doi: <pub-id pub-id-type="doi">10.1148/radiol.2018172361</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Da-ano</surname> <given-names>R</given-names>
</name>
<name>
<surname>Masson</surname> <given-names>I</given-names>
</name>
<name>
<surname>Lucia</surname> <given-names>F</given-names>
</name>
<name>
<surname>Dor&#xe9;</surname> <given-names>M</given-names>
</name>
<name>
<surname>Robin</surname> <given-names>P</given-names>
</name>
<name>
<surname>Alfieri</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Performance comparison of modified ComBat for harmonization of radiomic features for multicenter studies</article-title>. <source>Sci Rep</source> (<year>2020</year>) <volume>10</volume>(<issue>1</issue>):<fpage>10248</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-020-66110-w</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Da-Ano</surname> <given-names>R</given-names>
</name>
<name>
<surname>Visvikis</surname> <given-names>D</given-names>
</name>
<name>
<surname>Hatt</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Harmonization strategies for multicenter radiomics investigations</article-title>. <source>Phys Med Biol</source> (<year>2020</year>) <volume>65</volume>(<issue>24</issue>):<fpage>24TR02</fpage>. doi: <pub-id pub-id-type="doi">10.1088/1361-6560/aba798</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Horng</surname> <given-names>H</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>A</given-names>
</name>
<name>
<surname>Yousefi</surname> <given-names>B</given-names>
</name>
<name>
<surname>Cohen</surname> <given-names>EA</given-names>
</name>
<name>
<surname>Haghighi</surname> <given-names>B</given-names>
</name>
<name>
<surname>Katz</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Generalized ComBat harmonization methods for radiomic features with multi-modal distributions and multiple batch effects</article-title>. <source>Sci Rep</source> (<year>2022</year>) <volume>12</volume>(<issue>1</issue>):<fpage>4493</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-022-08412-9</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Orlhac</surname> <given-names>F</given-names>
</name>
<name>
<surname>Eertink</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Cottereau</surname> <given-names>AS</given-names>
</name>
<name>
<surname>Zijlstra</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Thieblemont</surname> <given-names>C</given-names>
</name>
<name>
<surname>Meignan</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>A guide to ComBat harmonization of imaging biomarkers in multicenter studies</article-title>. <source>J Nucl Med</source> (<year>2022</year>) <volume>63</volume>(<issue>2</issue>):<page-range>172&#x2013;9</page-range>. doi: <pub-id pub-id-type="doi">10.2967/jnumed.121.262464</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eisenhauer</surname> <given-names>EA</given-names>
</name>
<name>
<surname>Therasse</surname> <given-names>P</given-names>
</name>
<name>
<surname>Bogaerts</surname> <given-names>J</given-names>
</name>
<name>
<surname>Schwartz</surname> <given-names>LH</given-names>
</name>
<name>
<surname>Sargent</surname> <given-names>D</given-names>
</name>
<name>
<surname>Ford</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>New response evaluation criteria in solid tumours: revised RECIST guideline (version 1.1)</article-title>. <source>Eur J Cancer</source> (<year>2009</year>) <volume>45</volume>(<issue>2</issue>):<page-range>228&#x2013;47</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.ejca.2008.10.026</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Johnson</surname> <given-names>MK</given-names>
</name>
<collab>K. Feature Engineering and Selection</collab>
</person-group>. <source>A practical approach for predictive models</source> (<year>2022</year>). Available at: <uri xlink:href="https://bookdown.org/max/FES/">https://bookdown.org/max/FES/</uri>.</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Automatic approach for lung segmentation with juxta-pleural nodules from thoracic CT based on contour tracing and correction</article-title>. <source>Comput Math Methods Med</source> (<year>2016</year>) <volume>2016</volume>:<fpage>2962047</fpage>. doi: <pub-id pub-id-type="doi">10.1155/2016/2962047</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kuruvilla</surname> <given-names>J</given-names>
</name>
<name>
<surname>Gunavathi</surname> <given-names>DK</given-names>
</name>
</person-group>. <article-title>Detection of lung cancer using morphological operations</article-title>. <source>Inter J Sci Engineer Res</source> (<year>2013</year>) <volume>4</volume>(<issue>8</issue>):<fpage>4</fpage>.</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zwanenburg</surname> <given-names>A</given-names>
</name>
<name>
<surname>Leger</surname> <given-names>S</given-names>
</name>
<name>
<surname>Valli&#xe8;res</surname> <given-names>M</given-names>
</name>
<name>
<surname>L&#xf6;ck</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>Image biomarker standardisation initiative</article-title>. <source>Radiology</source> (<year>2020</year>) <volume>295</volume>(<issue>2</issue>):<page-range>328&#x2013;38</page-range>. doi: <pub-id pub-id-type="doi">10.1148/radiol.2020191145</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>W</given-names>
</name>
</person-group>. <article-title>Deep learning based radiomics (DLR) and its usage in noninvasive IDH1 prediction for low grade glioma</article-title>. <source>Sci Rep</source> (<year>2017</year>) <volume>7</volume>(<issue>1</issue>):<fpage>5467</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-017-05848-2</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>G</given-names>
</name>
<name>
<surname>Qiu</surname> <given-names>X</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>W</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>Deep learning with radiomics for disease diagnosis and treatment: challenges and potential</article-title>. <source>Front Oncol</source> (<year>2022</year>) <volume>12</volume>:<elocation-id>12</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fonc.2022.773840</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>T</given-names>
</name>
<name>
<surname>Kornblith</surname> <given-names>S</given-names>
</name>
<name>
<surname>Norouzi</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hinton</surname> <given-names>G</given-names>
</name>
</person-group>. <source>A simple framework for contrastive learning of visual representations [Internet]. arXiv</source> (<year>2020</year>). Available at: <uri xlink:href="http://arxiv.org/abs/2002.05709">http://arxiv.org/abs/2002.05709</uri>.</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>T</given-names>
</name>
<name>
<surname>Kornblith</surname> <given-names>S</given-names>
</name>
<name>
<surname>Swersky</surname> <given-names>K</given-names>
</name>
<name>
<surname>Norouzi</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hinton</surname> <given-names>G</given-names>
</name>
</person-group>. <source>Big self-supervised models are strong semi-supervised learners [Internet]. arXiv</source> (<year>2020</year>). Available at: <uri xlink:href="http://arxiv.org/abs/2006.10029">http://arxiv.org/abs/2006.10029</uri>.</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Armato</surname> <given-names>SG</given-names>
</name>
<name>
<surname>Roberts</surname> <given-names>RY</given-names>
</name>
<name>
<surname>McNitt-Gray</surname> <given-names>MF</given-names>
</name>
<name>
<surname>Meyer</surname> <given-names>CR</given-names>
</name>
<name>
<surname>Reeves</surname> <given-names>AP</given-names>
</name>
<name>
<surname>McLennan</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>The lung image database consortium (LIDC): ensuring the integrity of expert-defined &#x201c;truth&#x201d;</article-title>. <source>Acad Radiol</source> (<year>2007</year>) <volume>14</volume>(<issue>12</issue>):<page-range>1455&#x2013;63</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.acra.2007.08.006</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pudjihartono</surname> <given-names>N</given-names>
</name>
<name>
<surname>Fadason</surname> <given-names>T</given-names>
</name>
<name>
<surname>Kempa-Liehr</surname> <given-names>AW</given-names>
</name>
<name>
<surname>O&#x2019;Sullivan</surname> <given-names>JM</given-names>
</name>
</person-group>. <article-title>A review of feature selection methods for machine learning-based disease risk prediction</article-title>. <source>Front Bioinf</source> (<year>2022</year>) <volume>2</volume>:<elocation-id>927312</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fbinf.2022.927312</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bergstra</surname> <given-names>J</given-names>
</name>
<name>
<surname>Bengio</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>Random search for hyper-parameter optimization</article-title>. <source>J Machine Learning Res</source> (<year>2012</year>) <volume>13</volume>:<page-range>281&#x2013;305</page-range>.</citation>
</ref>
<ref id="B34">
<label>34</label>
<citation citation-type="web">
<source>Home - ReBATE</source> (<year>2022</year>). Available at: <uri xlink:href="https://epistasislab.github.io/ReBATE/">https://epistasislab.github.io/ReBATE/</uri>.</citation>
</ref>
<ref id="B35">
<label>35</label>
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Anand</surname> <given-names>R</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>M</given-names>
</name>
</person-group>. <source>Maximum relevance and minimum redundancy feature selection methods for a marketing machine learning platform [Internet]. arXiv</source> (<year>2019</year>). Available at: <uri xlink:href="http://arxiv.org/abs/1908.05376">http://arxiv.org/abs/1908.05376</uri>.</citation>
</ref>
<ref id="B36">
<label>36</label>
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Banjanovic</surname> <given-names>ES</given-names>
</name>
<name>
<surname>Osborne</surname> <given-names>JW</given-names>
</name>
</person-group>. <source>Confidence intervals for effect sizes: applying bootstrap resampling</source> (<year>2022</year>). Available at: <uri xlink:href="https://scholarworks.umass.edu/pare/vol21/iss1/5/">https://scholarworks.umass.edu/pare/vol21/iss1/5/</uri>.</citation>
</ref>
<ref id="B37">
<label>37</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hastie</surname> <given-names>T</given-names>
</name>
<name>
<surname>Tibshirani</surname> <given-names>R</given-names>
</name>
<name>
<surname>Friedman</surname> <given-names>J</given-names>
</name>
</person-group>. <source>Elements of statistical learning: data mining, inference, and prediction. 2nd edition</source>. <edition>2nd ed</edition>. <publisher-name>Springer</publisher-name>. (<year>2009</year>). Available at: <uri xlink:href="https://hastie.su.domains/ElemStatLearn/">https://hastie.su.domains/ElemStatLearn/</uri>.</citation>
</ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Primakov</surname> <given-names>SP</given-names>
</name>
<name>
<surname>Ibrahim</surname> <given-names>A</given-names>
</name>
<name>
<surname>van Timmeren</surname> <given-names>JE</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>G</given-names>
</name>
<name>
<surname>Keek</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Beuque</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Automated detection and segmentation of non-small cell lung cancer computed tomography images</article-title>. <source>Nat Commun</source> (<year>2022</year>) <volume>13</volume>(<issue>1</issue>):<fpage>3423</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-022-30841-3</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>