<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Artif. Intell.</journal-id>
<journal-title>Frontiers in Artificial Intelligence</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Artif. Intell.</abbrev-journal-title>
<issn pub-type="epub">2624-8212</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/frai.2025.1667167</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Artificial Intelligence</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A dynamic multitask evolutionary algorithm for high-dimensional feature selection based on multi-indicator task construction and elite competition learning</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Tie</surname><given-names>Jinxin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Yan</surname><given-names>Chunfang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname><given-names>Maosong</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Gong</surname><given-names>Jianqiang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wu</surname><given-names>Yujie</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Fang</surname><given-names>Hailin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname><given-names>Meng</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2939935/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Zhang</surname><given-names>Weiwei</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3136289/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Li</surname><given-names>Jie</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Ningbo Cigarette Factory, China Tobacco Zhejiang Industrial Co., Ltd.</institution>, <addr-line>Ningbo</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Technology Center, China Tobacco Zhejiang Industrial Co., Ltd.</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>College of Tobacco Science and Engineering, Zhengzhou University of Light Industry</institution>, <addr-line>Zhengzhou</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>College of Computer Science and Technology, Zhengzhou University of Light Industry</institution>, <addr-line>Zhengzhou</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0001"><p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2317559/overview">Ying Bi</ext-link>, Zhengzhou University, China</p></fn>
<fn fn-type="edited-by" id="fn0002"><p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3170049/overview">Emanuel Casmiry</ext-link>, Nelson Mandela African Institution of Science and Technology, Tanzania</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3185783/overview">Joko Triloka</ext-link>, Informatics and Business Institute Darmajaya, Indonesia</p></fn>
<corresp id="c001">&#x002A;Correspondence: Jie Li, <email>lijie@zjtobacco.com</email></corresp>
<corresp id="c002">Weiwei Zhang, <email>anqikeli@126.com</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>20</day>
<month>10</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>8</volume>
<elocation-id>1667167</elocation-id>
<history>
<date date-type="received">
<day>16</day>
<month>07</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>29</day>
<month>09</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Tie, Yan, Li, Gong, Wu, Fang, Li, Zhang and Li.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Tie, Yan, Li, Gong, Wu, Fang, Li, Zhang and Li</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>High-dimensional data often contain noisy and redundant features, posing challenges for accurate and efficient feature selection. To address this, a dynamic multitask learning framework is proposed, which integrates competitive learning and knowledge transfer within an evolutionary optimization setting. The framework begins by generating two complementary tasks through a multi-criteria strategy that combines multiple feature relevance indicators, ensuring both global comprehensiveness and local focus. These tasks are optimized in parallel using a competitive particle swarm optimization algorithm enhanced with hierarchical elite learning, where each particle learns from both winners and elite individuals to avoid premature convergence. To further improve optimization efficiency and diversity, a probabilistic elite-based knowledge transfer mechanism is introduced, allowing particles to selectively learn from elite solutions across tasks. Experimental results on 13 high-dimensional benchmark datasets demonstrate that the proposed algorithm achieves superior classification accuracy with fewer selected features compared to several state-of-the-art methods. Across 13 benchmarks, the proposed method achieves the highest accuracy on 11 out of 13 datasets and the fewest features on eight out of 13, with an average accuracy of 87.24% and an average dimensionality reduction of 96.2% (median 200 selected features), clearly validating its effectiveness in balancing exploration, exploitation, and knowledge sharing for robust feature selection.</p>
</abstract>
<kwd-group>
<kwd>feature selection</kwd>
<kwd>evolutionary multitask optimization</kwd>
<kwd>elite competition</kwd>
<kwd>knowledge transfer</kwd>
<kwd>high-dimensional data</kwd>
<kwd>tobacco data analytics</kwd>
</kwd-group>
<counts>
<fig-count count="8"/>
<table-count count="6"/>
<equation-count count="9"/>
<ref-count count="36"/>
<page-count count="15"/>
<word-count count="8866"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Machine Learning and Artificial Intelligence</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Feature selection has long been recognized as a critical step in machine learning and data mining, particularly when dealing with high-dimensional datasets. By identifying the most informative and non-redundant subset of features, feature selection not only improves model performance and interpretability but also significantly reduces computational costs. However, in high-dimensional spaces, the feature selection process becomes increasingly challenging due to the curse of dimensionality, feature redundancy, and complex interactions among variables.</p>
<p>Existing feature selection methods are broadly categorized into filter-based and wrapper-based approaches based on whether they rely on classifiers for subset evaluation. Filter methods assess features independently of any learning model, offering high efficiency and scalability, making them suitable for large-scale datasets (<xref ref-type="bibr" rid="ref12">Kamalov et al., 2025</xref>). Despite these advantages, their inability to consider interactions with learning algorithms often limits their performance in downstream classification tasks. In contrast, wrapper methods evaluate feature subsets by training predictive models, leading to better classification accuracy but incurring high computational costs, especially in high-dimensional settings (<xref ref-type="bibr" rid="ref22">Sadeghian et al., 2025</xref>).</p>
<p>Swarm intelligence algorithms, such as particle swarm optimization (PSO) and competitive swarm optimizer (CSO), have demonstrated strong potential in handling complex feature selection tasks (<xref ref-type="bibr" rid="ref11">Huda and Banka, 2019</xref>; <xref ref-type="bibr" rid="ref33">Tran et al., 2019</xref>; <xref ref-type="bibr" rid="ref28">Swesi and Bakar, 2019</xref>; <xref ref-type="bibr" rid="ref27">Song et al., 2021</xref>; <xref ref-type="bibr" rid="ref31">Too et al., 2019</xref>). These methods mimic social behaviors to search for optimal feature subsets by balancing exploration and exploitation. However, standard PSO- and CSO-based algorithms often face issues such as slow convergence or premature stagnation when applied to datasets with thousands of features (<xref ref-type="bibr" rid="ref7">Ding et al., 2020</xref>; <xref ref-type="bibr" rid="ref32">Tran et al., 2018</xref>; <xref ref-type="bibr" rid="ref21">Pichai et al., 2020</xref>; <xref ref-type="bibr" rid="ref14">Li et al., 2023</xref>). To address these challenges, recent studies have turned to Evolutionary Multitasking (EMT), which leverages the latent synergy among multiple tasks to accelerate search efficiency and improve generalization performance (<xref ref-type="bibr" rid="ref4">Chen et al., 2020</xref>; <xref ref-type="bibr" rid="ref5">Chen et al., 2021</xref>; <xref ref-type="bibr" rid="ref14">Li et al., 2023</xref>). However, most existing EMT-based feature selection methods still rely on fixed task definitions and lack adaptive mechanisms to dynamically construct tasks, evaluate task relevance, and selectively transfer knowledge. As a result, they are prone to negative transfer and limited scalability when applied to ultra-high-dimensional problems. Moreover, they rarely incorporate explicit competition mechanisms to maintain population diversity, which increases the risk of premature convergence.</p>
<p>To address these challenges, a novel dual-task multitask learning with competitive elites (DMLC-MTO) framework is proposed for high-dimensional feature selection. The core idea is to co-optimize a global task that retains the full feature space and an auxiliary task that operates on a reduced subset of features generated by multi-indicator integration. The optimization is driven by a competitive particle swarm mechanism with hierarchical elite learning and inter-task knowledge transfer. This approach aims to balance global exploration and local exploitation while leveraging the shared knowledge across tasks to escape local optima and boost search efficiency. The main contributions of this work are summarized as follows:</p><list list-type="order">
<list-item>
<p>A novel Dual-Task Evolutionary Multitasking Optimization (DMLC-MTO) framework is proposed. It balances global exploration and local exploitation to address redundant features and improve search efficiency in high-dimensional spaces.</p>
</list-item>
<list-item>
<p>A dynamic multi-indicator evaluation strategy is introduced for auxiliary task construction. It combines Relief-F and Fisher Score with adaptive thresholding to resolve indicator conflicts and select informative features.</p>
</list-item>
<list-item>
<p>A hierarchical elite-driven competitive optimization mechanism is designed. It enables intra- and inter-task knowledge transfer to enhance convergence stability and solution quality.</p>
</list-item>
</list>
<p>The remainder of this paper is organized as follows. Section 2 reviews related work on high-dimensional feature selection and multi-task optimization. Section 3 introduces the proposed dynamic multitask learning framework, including the task generation strategy, competitive particle swarm optimization with hierarchical elite learning, and the knowledge transfer mechanism. Section 4 presents experimental results and analysis on benchmark datasets. Finally, Section 5 concludes the paper and discusses future research directions.</p>
</sec>
<sec id="sec2">
<label>2</label>
<title>Related work</title>
<sec id="sec3">
<label>2.1</label>
<title>Problem formulation</title>
<p>Feature selection aims to identify a subset of informative features from a high-dimensional feature space while removing redundant or irrelevant ones. Formally, given a dataset <inline-formula>
<mml:math id="M1">
<mml:mi>D</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mo stretchy="true">{</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">}</mml:mo>
</mml:math>
</inline-formula>,<inline-formula>
<mml:math id="M2">
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#x22EF;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mi>n</mml:mi>
</mml:math>
</inline-formula>, where <inline-formula>
<mml:math id="M3">
<mml:msub>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi>&#x211D;</mml:mi>
<mml:mi>d</mml:mi>
</mml:msup>
</mml:math>
</inline-formula>is a feature vector and <inline-formula>
<mml:math id="M4">
<mml:msub>
<mml:mi mathvariant="normal">y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula> is the corresponding label, the objective is to find a binary selection vector <inline-formula>
<mml:math id="M5">
<mml:mi mathvariant="normal">z</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="true">{</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">}</mml:mo>
</mml:mrow>
<mml:mi>d</mml:mi>
</mml:msup>
</mml:math>
</inline-formula> such that the selected subset <inline-formula>
<mml:math id="M6">
<mml:mi>S</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo stretchy="true">{</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo>&#x2223;</mml:mo>
<mml:msub>
<mml:mi>z</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">}</mml:mo>
</mml:math>
</inline-formula>maximizes model performance with minimal feature count. This problem is inherently combinatorial and becomes more challenging as dimensionality increases, especially when feature relevance is sparse or context-dependent.</p>
<p>Due to the exponential number of possible feature subsets, feature selection is considered an NP-hard problem. In high-dimensional scenarios, especially when the number of features greatly exceeds the number of samples, the presence of redundant, noisy, or irrelevant features can severely degrade model performance and increase computational cost. Therefore, effective feature selection is critical for improving model generalization, enhancing interpretability, and reducing overfitting risks in complex learning tasks.</p>
</sec>
<sec id="sec4">
<label>2.2</label>
<title>Related work</title>
<p>Over the past decades, numerous FS algorithms have been developed, which can be broadly categorized into filter, wrapper, and evolutionary-based methods.</p>
<p>Filter methods select features based on their intrinsic properties such as correlation, information entropy, or discriminative power, independent of any classifier. Common approaches include correlation-based feature selection (CFS) (<xref ref-type="bibr" rid="ref10">Hall, 1999</xref>), mutual information (<xref ref-type="bibr" rid="ref34">Vergara and Est&#x00E9;vez, 2014</xref>), and Gini Index (<xref ref-type="bibr" rid="ref26">Solorio et al., 2020</xref>). Relief-F (<xref ref-type="bibr" rid="ref13">Kononenko, 1994</xref>), one of the earliest and most influential methods, ranks features by assessing how well they distinguish between instances of different classes. It demonstrates strong robustness to noise and applicability across different learning models. To alleviate feature redundancy, CFS (<xref ref-type="bibr" rid="ref10">Hall, 1999</xref>) evaluates feature subsets by considering both individual relevance and pairwise correlations. The fast correlation-based filter (FCBF) (<xref ref-type="bibr" rid="ref24">Senliol et al., 2008</xref>) further improves efficiency by rapidly removing redundant features based on entropy-based measures. In more complex scenarios involving mixed-type data, hybrid methods such as SFSDFC (<xref ref-type="bibr" rid="ref36">Yan et al., 2021</xref>) and UFS (<xref ref-type="bibr" rid="ref25">Solorio et al., 2024</xref>) have been proposed to integrate density-based clustering and spectral analysis for robust feature evaluation. Nevertheless, filter methods often suffer from suboptimal feature subset selection due to the lack of interaction with model performance.</p>
<p>Wrapper methods evaluate subsets of features using specific learning algorithms, offering better performance in classification tasks. Sequential forward selection (<xref ref-type="bibr" rid="ref9">Guan et al., 2004</xref>), sequential backward selection (SBS) (<xref ref-type="bibr" rid="ref8">Fern&#x00E1;ndez-Diego and Gonz&#x00E1;lez-Ladr&#x00F3;n-de-Guevara, 2018</xref>), and recursive feature elimination (RFE) (<xref ref-type="bibr" rid="ref20">Paul and Dupont, 2015</xref>) are classical examples. RFE, in particular, uses classifiers such as support vector machines to recursively remove the least important features, delivering high accuracy but with high computational cost. Hybrid and heuristic wrappers have emerged to improve efficiency, including mixed forward selection (MFS) (<xref ref-type="bibr" rid="ref29">Tang and Mao, 2007</xref>), binomial cuckoo search (<xref ref-type="bibr" rid="ref18">Pandey et al., 2020</xref>), and binary Jaya with TOPSIS decision logic (<xref ref-type="bibr" rid="ref2">Chaudhuri and Sahu, 2021</xref>). Metaheuristic-based methods, such as Firefly Algorithm and Hyena Optimization (<xref ref-type="bibr" rid="ref16">Lohitha and Pounambal, 2022</xref>), have also been used to balance search quality and complexity. Although wrapper methods provide better feature subsets, they often become infeasible on large-scale or high-dimensional data due to their high time complexity.</p>
<p>Evolutionary algorithm such as PSO and CSO have been widely adopted for feature selection due to their capability in handling large search spaces (<xref ref-type="bibr" rid="ref11">Huda and Banka, 2019</xref>; <xref ref-type="bibr" rid="ref33">Tran et al., 2019</xref>; <xref ref-type="bibr" rid="ref28">Swesi and Bakar, 2019</xref>; <xref ref-type="bibr" rid="ref27">Song et al., 2021</xref>; <xref ref-type="bibr" rid="ref31">Too et al., 2019</xref>). PSO variants have been enhanced with rough sets (<xref ref-type="bibr" rid="ref11">Huda and Banka, 2019</xref>), adaptive subpopulation strategies (<xref ref-type="bibr" rid="ref33">Tran et al., 2019</xref>), and feature clustering (<xref ref-type="bibr" rid="ref28">Swesi and Bakar, 2019</xref>). Meanwhile, CSO has been improved with binary encoding (<xref ref-type="bibr" rid="ref31">Too et al., 2019</xref>), genetic operators (<xref ref-type="bibr" rid="ref7">Ding et al., 2020</xref>), and chaotic functions (<xref ref-type="bibr" rid="ref21">Pichai et al., 2020</xref>) to increase diversity and convergence speed. In addition, PSO and other metaheuristic-based algorithms have also shown strong adaptability in broader application domains, such as cloud resource forecasting (<xref ref-type="bibr" rid="ref23">Salb et al., 2024</xref>), software defect prediction (<xref ref-type="bibr" rid="ref35">Villoth et al., 2025</xref>), sentiment classification (<xref ref-type="bibr" rid="ref17">Mladenovic et al., 2024</xref>), and intrusion detection in IoT systems (<xref ref-type="bibr" rid="ref6">Dakic et al., 2024</xref>).</p>
<p>However, these methods still suffer from premature convergence and inefficient exploration in ultra-high-dimensional settings. As a response, evolutionary multitasking (EMT) strategies have been introduced to feature selection problems. Chen proposed multitask PSO methods (<xref ref-type="bibr" rid="ref4">Chen et al., 2020</xref>; <xref ref-type="bibr" rid="ref5">Chen et al., 2021</xref>) that convert high-dimensional feature selection into correlated subtasks and facilitate knowledge transfer between them. More recently, Li extended this idea by integrating filter-based indicators to generate diverse auxiliary tasks (<xref ref-type="bibr" rid="ref14">Li et al., 2023</xref>), further improving optimization performance on high-dimensional datasets. However, most existing MTL or transfer-based FS methods still rely on fixed task definitions and lack adaptive mechanisms for dynamic task construction, relevance evaluation, and selective transfer.</p>
<p>In addition, few works consider integrating multiple evaluation criteria to construct feature relevance measures dynamically. The conflict between different indicators (e.g., Relief-F vs. Fisher Score) often leads to inconsistent selection results. Furthermore, evolutionary optimization in multitask FS scenarios still faces challenges such as inefficient exploration, insufficient exploitation of inter-task knowledge, and the risk of negative transfer.</p>
<p>Despite the progress made, several challenges in high-dimensional feature selection remain insufficiently addressed. These include how to construct auxiliary tasks in a data-driven manner using multiple relevance indicators, how to facilitate effective yet selective knowledge transfer between tasks, and how to improve search efficiency without compromising solution quality. This work explores these aspects by proposing a multitask optimization framework that incorporates multi-criteria based task construction, competitive learning with hierarchical elites and elite-based knowledge transfer strategy to enhance the feature selection process.</p>
</sec>
</sec>
<sec id="sec5">
<label>3</label>
<title>The proposed algorithm</title>
<sec id="sec6">
<label>3.1</label>
<title>Main framework of the proposed algorithm</title>
<p>To address the challenges of high-dimensional feature selection, we propose a novel evolutionary multitasking optimization framework, DMLC-MTO (dynamic multitask learning via competitive elites) is proposed. The core idea is to jointly explore the global feature space and exploit locally informative subsets through a dual-task structure, enhanced by elite-guided search.</p>
<p>As illustrated in <xref ref-type="fig" rid="fig1">Figure 1</xref>, DMLC-MTO operates on two complementary tasks. The primary task performs global feature optimization in the full feature space, while the auxiliary task focuses on a reduced subspace constructed via a Multi-Criteria based Task Generation Strategy. This task division allows the algorithm to simultaneously capture broad feature relevance and fine-grained local discriminability.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>The framework of the proposed DMLC-MTO.</p>
</caption>
<graphic xlink:href="frai-08-1667167-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Flowchart illustrating a two-part process. The first part, "Multi-Criteria Based Task Generation," starts with training data, calculating feature weights using Relief-F and Fisher Score, fusing these weights, rearranging features, and selecting tasks based on feature sets. The second part, "Elite-Guided Competitive Particle Swarm Optimization," initializes the population, splits into subpopulations for different tasks, undergoes competitive learning, and updates velocity using knowledge transfer. Ends with generating an optimal feature subset upon meeting stopping criteria.</alt-text>
</graphic>
</fig>
<p>Both tasks evolve independently through competitive particle swarm optimization but interact dynamically via an elite-based knowledge sharing mechanism. High-quality solutions from one task can influence the search direction of the other, enabling mutual reinforcement and improving convergence behavior. The overall workflow of DMLC-MTO is outlined in <xref ref-type="fig" rid="fig2">Algorithm 1</xref>.</p>
<fig position="float" id="fig2">
<label>ALGORITHM 1</label>
<caption>
<p>DMLC-MTO optimization framework.</p>
</caption>
<graphic xlink:href="frai-08-1667167-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Flowchart detailing a feature selection process: Start with a complete feature set and aim to output a selected subset. Steps include: generating tasks via a multi-criteria strategy; initializing populations for two tasks; evolving tasks using competitive learning with hierarchical elites and knowledge transfer until criteria are met; and finally, returning the best-performing subset.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec7">
<label>3.2</label>
<title>Multi-criteria based task generation strategy</title>
<p>In high-dimensional feature selection, designing an effective auxiliary task is a key challenge for multitask optimization. Naively increasing the number of tasks often leads to unnecessary computational overhead and increases the risk of negative transfer. To address this, DMLC-MTO adopts a two-task paradigm: the primary task operates on the full feature space to ensure global exploration, while the auxiliary task focuses on a compact subset of features to enable refined local optimization. A critical factor in the success of this paradigm is how the auxiliary feature subset is constructed.</p>
<p>Traditional evaluation methods, such as Relief-F and Fisher Score, offer different perspectives on feature importance. Relief-F emphasizes neighborhood-based instance discrimination, while Fisher Score captures between-class variance. However, these approaches often produce inconsistent feature rankings when used independently, particularly in high-dimensional settings where feature redundancy and noise are common. To mitigate these inconsistencies, this work proposes a Multi-Criteria Based Task Generation Strategy that integrates both metrics into a unified scoring framework.</p>
<p>As shown in <xref ref-type="disp-formula" rid="EQ1">Equation 1</xref> the strategy begins by independently computing the importance weights of each feature using both Relief-F and Fisher Score. These two score vectors are then fused using a weighted linear combination.</p><disp-formula id="EQ1">
<label>(1)</label>
<mml:math id="M7">
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mi>&#x03B1;</mml:mi>
<mml:mo>&#x22C5;</mml:mo>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi mathvariant="italic">RF</mml:mi>
</mml:msubsup>
<mml:mo>+</mml:mo>
<mml:mi>&#x03B2;</mml:mi>
<mml:mo>&#x22C5;</mml:mo>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi mathvariant="italic">FS</mml:mi>
</mml:msubsup>
</mml:math>
</disp-formula>
<p>Where <inline-formula>
<mml:math id="M8">
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mspace width="0em"/>
</mml:math>
</inline-formula>denotes the combined weight of the <italic>i</italic>-th feature, <italic>&#x03B1;</italic> and <italic>&#x03B2;</italic> control the relative contribution of each metric, allowing flexible adjustment based on data characteristics. This yields a comprehensive feature relevance score for each feature.</p>
<p>Instead of arbitrarily selecting a fixed number of features (e.g., top-k), the proposed strategy employs knee point detection to adaptively determine the weight threshold for feature selection, ensuring both focus and relevance. As illustrated in <xref ref-type="fig" rid="fig3">Figure 2</xref>, each feature&#x2019;s score is first calculated and ranked in descending order. A curve is plotted based on these scores, and a straight line is drawn connecting the highest and lowest points. The feature corresponding to the maximum perpendicular distance between the curve and the line, which is the knee point and marked as the red point in <xref ref-type="fig" rid="fig3">Figure 2</xref>, is identified as the selection threshold. Features with scores above this threshold are considered the most significant and are subsequently selected for Task 2.</p>
<fig position="float" id="fig3">
<label>Figure 2</label>
<caption>
<p>Feature score curve and knee point detection for adaptive thresholding.</p>
</caption>
<graphic xlink:href="frai-08-1667167-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Diagram showing feature selection process. A series of features \(W_1, W_2, \ldots, W_n\) are weighted and ranked on a graph with feature weight on the y-axis and feature ranking on the x-axis. A curve illustrates the ranking process, leading to selected features \(F_1, F_3, F_{15}, \ldots, F_k\) for Task 2.</alt-text>
</graphic>
</fig>
<p>This adaptive thresholding technique ensures that the selected features are statistically meaningful and tailored to the data distribution, avoiding arbitrary cutoffs and improving robustness. As a result, Task 2 is constructed using only the features above the knee point, while Task 1 retains the full feature set. This design ensures that the auxiliary task remains focused and efficient, while the primary task provides broader coverage, allowing the multitask optimization process to benefit from both global and fine-grained representations.</p>
</sec>
<sec id="sec8">
<label>3.3</label>
<title>Elite-guided competitive particle swarm optimization</title>
<p>High-dimensional feature selection presents two key challenges for evolutionary algorithms: premature convergence and inefficient exploration. Standard PSO often struggles in such settings, especially when the feature space is sparse or the objective landscape is complex and multimodal. To overcome these limitations, the proposed DMLC-MTO framework incorporates an enhanced optimization strategy called elite-guided competitive PSO (EC-PSO), which integrates competitive learning with hierarchical elites and cross-task knowledge transfer.</p>
<sec id="sec9">
<label>3.3.1</label>
<title>Competitive learning with hierarchical elites</title>
<p>The EC-PSO builds upon the CSO, which introduces pairwise competitions among particles. As shown in <xref ref-type="fig" rid="fig4">Figure 3</xref>, in each generation, particles are randomly grouped into pairs. Within each pair, the particle with superior fitness is marked as the winner, and the other as the loser. The loser updates its velocity and position by learning from the winner and the population centroid, according to <xref ref-type="disp-formula" rid="EQ2">Equations 2</xref>, <xref ref-type="disp-formula" rid="EQ3">3</xref>:</p><disp-formula id="EQ2">
<label>(2)</label>
<mml:math id="M9">
<mml:mtable columnalign="left" displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="normal">V</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>W</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mspace width="4em"/>
<mml:mo>+</mml:mo>
<mml:mi>&#x03C6;</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:math>
</disp-formula><disp-formula id="EQ3">
<label>(3)</label>
<mml:math id="M10">
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</disp-formula><p>where <italic>r</italic><sub>1</sub>,<italic>r</italic><sub>2</sub>,<italic>r</italic><sub>3</sub>&#x2208;[0,1] are random coefficients, <inline-formula>
<mml:math id="M11">
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>W</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>is the winner&#x2019;s position, <inline-formula>
<mml:math id="M12">
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> is the average position of all particles, and <inline-formula>
<mml:math id="M13">
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math id="M14">
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula> denote the velocity and position of the loser, respectively, <inline-formula>
<mml:math id="M15">
<mml:mi>&#x03C6;</mml:mi>
</mml:math>
</inline-formula>controls the influence of <inline-formula>
<mml:math id="M16">
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>. This formulation ensures convergence toward both local optima (through direct winner imitation) and the population mean (to maintain diversity).</p>
<fig position="float" id="fig4">
<label>Figure 3</label>
<caption>
<p>Competition among particles in classical CSO.</p>
</caption>
<graphic xlink:href="frai-08-1667167-g004.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Diagram illustrating a hierarchical structure of labeled data. The top cloud contains blue dots representing concepts. Below, clusters of circles represent paired elements labeled as "w" (red) and "l" (blue), with multiple rows indicating different layers or categories. Arrows indicate relationships, and layers are enclosed in dashed rectangles, labeled as \( w_1 \), \( L_1 \), \( w_2 \), \( L_2 \), and so on.</alt-text>
</graphic>
</fig>
<p>However, standard CSO lacks global guidance and can stagnate when the winner&#x2019;s solution quality plateaus. To enhance the convergence performance in high-dimensional feature selection, DMLC-MTO incorporates an elite-driven competitive learning mechanism. As shown in <xref ref-type="fig" rid="fig5">Figure 4</xref>, in each optimization iteration, the algorithm identifies the top-K best-performing particles in each task to form a task-specific elite pool. After applying the pairwise competition strategy, each loser particle is given a probability &#x1D443;&#x1D458; to learn from a randomly selected particle in the elite pool instead of the winner in its own pair. This elite-level guidance introduces a long-term memory mechanism that directs losers toward globally promising solutions, helping the swarm avoid local stagnation.</p>
<fig position="float" id="fig5">
<label>Figure 4</label>
<caption>
<p>Competitive learning with hierarchical elites.</p>
</caption>
<graphic xlink:href="frai-08-1667167-g005.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Diagram of a competitive learning framework. On the left, an illustration labeled "Competitive Learning" shows a structure with layers L1 and weights w1, using blue and red circles. On the right, labeled "Competitive Learning with Hierarchical Elites," layers E and L1 are shown with yellow and blue circles. The top portion features interconnected cloud shapes, representing information exchange between the two learning paradigms.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec10">
<label>3.3.2</label>
<title>Elite-based knowledge transfer strategy</title>
<p>In multitask optimization, knowledge transfer between tasks plays a vital role in improving overall search performance by sharing successful patterns. To this end, DMLC-MTO introduces a hierarchical elite-based transfer strategy. Specifically, for each loser particle, a random number is generated and compared with a predefined transfer probability &#x1D443;trans. If the transfer condition is satisfied, the particle is allowed to learn from elite solutions of another task, rather than only relying on intra-task updates.</p>
<p>Furthermore, within both intra-task and cross-task settings, the algorithm checks whether another random value exceeds the elite learning threshold &#x1D443;&#x1D458;. If so, the particle learns from an elite particle; otherwise, it learns from the average position of all particles or elites in the corresponding task. The update strategy thus includes four distinct modes as <xref ref-type="disp-formula" rid="EQ4">Equations 4</xref>&#x2013;<xref ref-type="disp-formula" rid="EQ7">7</xref>:</p><disp-formula id="EQ4">
<label>(4)</label>
<mml:math id="M17">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msubsup>
<mml:mi mathvariant="normal">V</mml:mi>
<mml:mi>L</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mi>X</mml:mi>
<mml:mtext mathvariant="italic">Erand</mml:mtext>
<mml:mtext mathvariant="italic">task</mml:mtext>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mtext mathvariant="italic">Erand</mml:mtext>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:math>
</disp-formula><disp-formula id="EQ5">
<label>(5)</label>
<mml:math id="M18">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msubsup>
<mml:mi mathvariant="normal">V</mml:mi>
<mml:mi>L</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mi>X</mml:mi>
<mml:mi>W</mml:mi>
<mml:mtext mathvariant="italic">task</mml:mtext>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mtext mathvariant="italic">wrand</mml:mtext>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:math>
</disp-formula><disp-formula id="EQ6">
<label>(6)</label>
<mml:math id="M19">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:mtable>
<mml:mtr>
<mml:mtd>
<mml:msubsup>
<mml:mi mathvariant="normal">V</mml:mi>
<mml:mi>L</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mi>X</mml:mi>
<mml:mtext mathvariant="italic">Erand</mml:mtext>
<mml:mtext mathvariant="italic">task</mml:mtext>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mo>+</mml:mo>
<mml:mi>&#x03C6;</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mi>E</mml:mi>
<mml:mtext mathvariant="italic">task</mml:mtext>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd/>
</mml:mtr>
</mml:mtable>
</mml:math>
</disp-formula><disp-formula id="EQ7">
<label>(7)</label>
<mml:math id="M20">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msubsup>
<mml:mi mathvariant="normal">V</mml:mi>
<mml:mi>L</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>+</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:msubsup>
<mml:mi>X</mml:mi>
<mml:mi>W</mml:mi>
<mml:mtext mathvariant="italic">task</mml:mtext>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mo>+</mml:mo>
<mml:mi>&#x03C6;</mml:mi>
<mml:mo>&#x00D7;</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo stretchy="true">)</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:math>
</disp-formula>
<p>Where <inline-formula>
<mml:math id="M21">
<mml:msubsup>
<mml:mi>X</mml:mi>
<mml:mtext mathvariant="italic">Erand</mml:mtext>
<mml:mtext mathvariant="italic">task</mml:mtext>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>a particle randomly selected from the elite pool within the current task, while <inline-formula>
<mml:math id="M22">
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mtext mathvariant="italic">Erand</mml:mtext>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>is randomly chosen from the elite pool of other tasks, <inline-formula>
<mml:math id="M23">
<mml:msubsup>
<mml:mi>X</mml:mi>
<mml:mi>W</mml:mi>
<mml:mtext mathvariant="italic">task</mml:mtext>
</mml:msubsup>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>denotes the winner particle within the same task, <inline-formula>
<mml:math id="M24">
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mtext mathvariant="italic">wrand</mml:mtext>
</mml:msub>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>is a randomly selected winner from other tasks, represents the average position of elites in the current task, <inline-formula>
<mml:math id="M25">
<mml:mover accent="true">
<mml:mi>X</mml:mi>
<mml:mo stretchy="true">&#x00AF;</mml:mo>
</mml:mover>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>denotes the average position of all particles in the current population, <inline-formula>
<mml:math id="M26">
<mml:mi>&#x03C6;</mml:mi>
</mml:math>
</inline-formula>serves as a control factor to regulate the influence of the corresponding learning component. From <xref ref-type="disp-formula" rid="EQ4 EQ5 EQ6 EQ7">Equations 4&#x2013;7</xref>, it can be observed that each particle updates its position by simultaneously learning from two types of sources. By incorporating knowledge from the winner in the same task, the winner from another task, the average position of elite particles within the current task, and the overall population mean, the particle significantly enhances its search capability. This design helps maintain population diversity and improves optimization efficiency.</p>
</sec>
</sec>
<sec id="sec11">
<label>3.4</label>
<title>Fitness function</title>
<p>An effective fitness function plays a vital role in guiding the evolutionary search toward an optimal feature subset. In this study, we adopt an evaluation strategy that considers both classification performance and feature compactness is adopted. The overall fitness function is defined as <xref ref-type="disp-formula" rid="EQ8">Equations 8</xref>, <xref ref-type="disp-formula" rid="EQ9">9</xref>:</p><disp-formula id="EQ8">
<label>(8)</label>
<mml:math id="M27">
<mml:mtext mathvariant="italic">fitness</mml:mtext>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x03B1;</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
<mml:mo>&#x2217;</mml:mo>
<mml:mi mathvariant="italic">&#x03B3;R</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>D</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x03B1;</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>&#x2217;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>S</mml:mi>
<mml:mo>&#x2223;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2223;</mml:mo>
<mml:mi>N</mml:mi>
<mml:mo>&#x2223;</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:math>
</disp-formula><disp-formula id="EQ9">
<label>(9)</label>
<mml:math id="M28">
<mml:mi mathvariant="italic">&#x03B3;R</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>D</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>C</mml:mi>
</mml:mfrac>
<mml:mo>&#x2217;</mml:mo>
<mml:munderover>
<mml:mo movablelimits="false">&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>C</mml:mi>
</mml:munderover>
<mml:msub>
<mml:mi mathvariant="italic">TPR</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</disp-formula>
<p>Where <inline-formula>
<mml:math id="M29">
<mml:mi mathvariant="italic">&#x03B3;R</mml:mi>
<mml:mo stretchy="true">(</mml:mo>
<mml:mi>D</mml:mi>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>denotes the probability of classification error. The term <inline-formula>
<mml:math id="M30">
<mml:mo>&#x2223;</mml:mo>
<mml:mi>S</mml:mi>
<mml:mo>&#x2223;</mml:mo>
</mml:math>
</inline-formula>indicates the number of selected features used to construct the model, while <inline-formula>
<mml:math id="M31">
<mml:mo>&#x2223;</mml:mo>
<mml:mi>N</mml:mi>
<mml:mo>&#x2223;</mml:mo>
</mml:math>
</inline-formula>corresponds to the total number of available features in the dataset. The parameter <inline-formula>
<mml:math id="M32">
<mml:msub>
<mml:mi>&#x03B1;</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>, ranging between 0 and 1, controls the trade-off between classification accuracy and feature sparsity. Following the recommendation in <xref ref-type="bibr" rid="ref3">Chen et al. (2019)</xref>, <italic>&#x03B1;</italic> is set as 0.999999 to place a stronger emphasis on classification performance. The number of classes C reflects the total distinct categories involved in the classification task. For each class <italic>i</italic>, the true positive rate <inline-formula>
<mml:math id="M33">
<mml:msub>
<mml:mi mathvariant="italic">TPR</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:math>
</inline-formula>is computed as the proportion of correctly predicted instances within that class relative to the total number of samples in the same class (<xref ref-type="bibr" rid="ref19">Patterson and Zhang, 2007</xref>). Using the balanced error metric mitigates the influence of class imbalance, ensuring that all classes contribute equally to the evaluation. This is particularly important in feature selection, where biased evaluation can lead to overfitting to majority classes and suboptimal feature subsets.</p>
</sec>
</sec>
<sec id="sec12">
<label>4</label>
<title>Experimental results and analysis</title>
<sec id="sec13">
<label>4.1</label>
<title>Experimental setup</title>
<p>To comprehensively evaluate the performance of the proposed algorithm, experiments were conducted on 13 high-dimensional real-world datasets drawn from various application domains. These datasets exhibit a wide range of feature dimensions, varying from 2,000 to over 13,000, making them suitable for assessing the algorithm&#x2019;s effectiveness under diverse and complex conditions. Detailed characteristics of each dataset&#x2014;including the dataset name, number of features, number of samples, and number of classes&#x2014;are summarized in <xref ref-type="table" rid="tab1">Table 1</xref>.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Dataset.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">No.</th>
<th align="left" valign="top">Dataset</th>
<th align="center" valign="top">Feature no.</th>
<th align="center" valign="top">Instance no.</th>
<th align="center" valign="top">Class no.</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">1</td>
<td align="left" valign="middle">SRBCT</td>
<td align="center" valign="middle">2,308</td>
<td align="center" valign="middle">83</td>
<td align="center" valign="middle">4</td>
</tr>
<tr>
<td align="left" valign="middle">2</td>
<td align="left" valign="middle">warpPIE10P</td>
<td align="center" valign="middle">2,420</td>
<td align="center" valign="middle">210</td>
<td align="center" valign="middle">10</td>
</tr>
<tr>
<td align="left" valign="middle">3</td>
<td align="left" valign="middle">Lymphoma</td>
<td align="center" valign="middle">5,026</td>
<td align="center" valign="middle">62</td>
<td align="center" valign="middle">3</td>
</tr>
<tr>
<td align="left" valign="middle">4</td>
<td align="left" valign="middle">Nci</td>
<td align="center" valign="middle">5,244</td>
<td align="center" valign="middle">61</td>
<td align="center" valign="middle">8</td>
</tr>
<tr>
<td align="left" valign="middle">5</td>
<td align="left" valign="middle">Leukemia 1</td>
<td align="center" valign="middle">5,327</td>
<td align="center" valign="middle">72</td>
<td align="center" valign="middle">3</td>
</tr>
<tr>
<td align="left" valign="middle">6</td>
<td align="left" valign="middle">DLBCL</td>
<td align="center" valign="middle">5,469</td>
<td align="center" valign="middle">77</td>
<td align="center" valign="middle">2</td>
</tr>
<tr>
<td align="left" valign="middle">7</td>
<td align="left" valign="middle">Prostate6033</td>
<td align="center" valign="middle">6,033</td>
<td align="center" valign="middle">102</td>
<td align="center" valign="middle">2</td>
</tr>
<tr>
<td align="left" valign="middle">8</td>
<td align="left" valign="middle">ALLAML</td>
<td align="center" valign="middle">7,129</td>
<td align="center" valign="middle">72</td>
<td align="center" valign="middle">2</td>
</tr>
<tr>
<td align="left" valign="middle">9</td>
<td align="left" valign="middle">Nci9</td>
<td align="center" valign="middle">9,712</td>
<td align="center" valign="middle">60</td>
<td align="center" valign="middle">9</td>
</tr>
<tr>
<td align="left" valign="middle">10</td>
<td align="left" valign="middle">Orlraws10P</td>
<td align="center" valign="middle">10,304</td>
<td align="center" valign="middle">100</td>
<td align="center" valign="middle">10</td>
</tr>
<tr>
<td align="left" valign="middle">11</td>
<td align="left" valign="middle">Prostate</td>
<td align="center" valign="middle">10,509</td>
<td align="center" valign="middle">102</td>
<td align="center" valign="middle">2</td>
</tr>
<tr>
<td align="left" valign="middle">12</td>
<td align="left" valign="middle">Leukemia 2</td>
<td align="center" valign="middle">11,225</td>
<td align="center" valign="middle">72</td>
<td align="center" valign="middle">3</td>
</tr>
<tr>
<td align="left" valign="middle">13</td>
<td align="left" valign="middle">Lung cancer</td>
<td align="center" valign="middle">12,600</td>
<td align="center" valign="middle">203</td>
<td align="center" valign="middle">5</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>To evaluate the effectiveness of the proposed DMLC-MTO algorithm, comprehensive comparisons were conducted with four competitive evolutionary algorithm EA-based feature selection methods: PSO (<xref ref-type="bibr" rid="ref1">Ansari et al., 2019</xref>), CSO-FS (<xref ref-type="bibr" rid="ref30">Tian et al., 2019</xref>), PSO-EMT (<xref ref-type="bibr" rid="ref4">Chen et al., 2020</xref>), and MT-PSO (<xref ref-type="bibr" rid="ref5">Chen et al., 2021</xref>). PSO serves as a baseline representing standard EA strategies, while CSO-FS incorporates the traditional CSO search mechanism specifically designed for feature selection. PSO-EMT and MT-PSO both adopt multitask learning paradigms to better address the challenges of high-dimensional feature spaces, and have demonstrated competitive performance in previous studies. All experiments were implemented in MATLAB R2020a and executed on a Windows 10 machine with a 2.6&#x202F;GHz Intel Core i5 processor and 16GB RAM, ensuring a consistent computational environment across all methods. To prevent feature selection bias and ensure an unbiased evaluation, feature selection was performed separately within each training fold during cross-validation. Specifically, for each fold, the training data was used to generate tasks and perform feature selection, and the resulting selected features were then applied to the held-out test fold for performance evaluation. This nested-like procedure ensures that no information from the test set is used during feature selection, thereby providing a reliable estimate of the algorithm&#x2019;s generalization performance.</p>
<p>In addition to these methods, this work included a baseline classifier without any feature selection (referred to as FULL) to highlight the improvements achieved by each FS approach in terms of classification accuracy and dimensionality reduction. All experimental results were obtained from 30 independent runs to account for algorithmic stochasticity. For statistical validation, the Wilcoxon signed-rank test was applied at a significance level of 0.05. In the analysis, the symbols &#x201C;+,&#x201D; &#x201C;&#x2212;,&#x201D; and &#x201C;=&#x201D; denote that a comparison method performs significantly better, worse, or comparable to the proposed DMLC-MTO, respectively.</p>
<p>To ensure fair and consistent comparisons, all algorithms were evaluated under standardized experimental settings. Each task was executed with a population size of 70 and a maximum of 100 iterations. Additionally, the proposed algorithm is model-agnostic and compatible with various classifiers, making it adaptable to different application scenarios without restricting the choice of classification models. The complete parameter configurations for all methods are summarized in <xref ref-type="table" rid="tab2">Table 2</xref> to support reproducibility and facilitate future implementation.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Algorithms parameters setting.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Algorithms</th>
<th align="left" valign="top">Parameters</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">PSO</td>
<td align="left" valign="middle">
<inline-formula>
<mml:math id="M34">
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>1.49445</mml:mn>
</mml:math>
</inline-formula>
<break/>
<inline-formula>
<mml:math id="M35">
<mml:mi>w</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.9</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.5</mml:mn>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mtext mathvariant="italic">iter</mml:mtext>
<mml:mo>/</mml:mo>
<mml:msub>
<mml:mi>n</mml:mi>
<mml:mtext mathvariant="italic">iter</mml:mtext>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="left" valign="middle">CSO-FS</td>
<td align="left" valign="middle">
<inline-formula>
<mml:math id="M36">
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mo stretchy="true">[</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">]</mml:mo>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="left" valign="middle">PSO-EMT</td>
<td align="left" valign="middle">
<inline-formula>
<mml:math id="M37">
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>1.49445</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>&#x03C1;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.05</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="italic">rmp</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.6</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>m</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>10</mml:mn>
</mml:math>
</inline-formula>
<break/>
<inline-formula>
<mml:math id="M38">
<mml:mi>w</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.9</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.5</mml:mn>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mtext mathvariant="italic">iter</mml:mtext>
<mml:mo>/</mml:mo>
<mml:msub>
<mml:mi>n</mml:mi>
<mml:mtext mathvariant="italic">iter</mml:mtext>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="left" valign="middle">MT-PSO</td>
<td align="left" valign="middle">
<inline-formula>
<mml:math id="M39">
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>1.49445</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>&#x03C1;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.05</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="italic">rmp</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.6</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>6</mml:mn>
</mml:math>
</inline-formula>
<break/>
<inline-formula>
<mml:math id="M40">
<mml:mi>w</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.9</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.5</mml:mn>
<mml:mo>&#x00D7;</mml:mo>
<mml:mo stretchy="true">(</mml:mo>
<mml:mtext mathvariant="italic">iter</mml:mtext>
<mml:mo>/</mml:mo>
<mml:msub>
<mml:mi>n</mml:mi>
<mml:mtext mathvariant="italic">iter</mml:mtext>
</mml:msub>
<mml:mo stretchy="true">)</mml:mo>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="left" valign="middle">DMLC-MTO</td>
<td align="left" valign="middle"><inline-formula>
<mml:math id="M41">
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mo stretchy="true">[</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo stretchy="true">]</mml:mo>
</mml:math>
</inline-formula><break/><inline-formula>
<mml:math id="M42">
<mml:mi>P</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0.6</mml:mn>
</mml:math>
</inline-formula><break/><italic>Pk</italic> =&#x202F;0.6<break/><inline-formula>
<mml:math id="M43">
<mml:msub>
<mml:mi>&#x03B1;</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>0.999999</mml:mn>
</mml:math>
</inline-formula></td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec14">
<label>4.2</label>
<title>Comparison with the state-of-the-art algorithms</title>
<sec id="sec15">
<label>4.2.1</label>
<title>Classification accuracy comparison</title>
<p><xref ref-type="table" rid="tab3">Table 3</xref> presents the classification accuracy of DMLC-MTO compared to four baseline algorithms across multiple datasets. Among 65 comparisons, DMLC-MTO outperforms the other methods in 56 cases, achieves comparable results in 8, and underperforms in only 1 case. These results demonstrate the overall superiority and robustness of the proposed method. A detailed analysis is as follows:</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Classification accuracy of the compared algorithms on multiple datasets.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Dataset</th>
<th align="center" valign="top">FULL</th>
<th align="center" valign="top">PSO</th>
<th align="center" valign="top">CSO-FS</th>
<th align="center" valign="top">PSO-EMT</th>
<th align="center" valign="top">MT-PSO</th>
<th align="center" valign="top">DMLC-MTO</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">SRBCT</td>
<td align="center" valign="middle">80 (&#x2212;)</td>
<td align="center" valign="middle">95.27 (=)</td>
<td align="center" valign="middle">95.13 (=)</td>
<td align="center" valign="middle">95.12 (=)</td>
<td align="center" valign="middle">95.21 (=)</td>
<td align="center" valign="middle"><bold>95.3</bold></td>
</tr>
<tr>
<td align="left" valign="middle">warpPIE10P</td>
<td align="center" valign="middle">83.58 (&#x2212;)</td>
<td align="center" valign="middle">98.17 (&#x2212;)</td>
<td align="center" valign="middle">51.54 (&#x2212;)</td>
<td align="center" valign="middle">99.12 (=)</td>
<td align="center" valign="middle">99.21 (=)</td>
<td align="center" valign="middle"><bold>99.13</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Lymphoma</td>
<td align="center" valign="middle">99.08 (&#x2212;)</td>
<td align="center" valign="middle">81.35 (&#x2212;)</td>
<td align="center" valign="middle">55.14 (&#x2212;)</td>
<td align="center" valign="middle">93.26 (&#x2212;)</td>
<td align="center" valign="middle">96.51 (&#x2212;)</td>
<td align="center" valign="middle"><bold>99.22</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Nci</td>
<td align="center" valign="middle">66.46 (&#x2212;)</td>
<td align="center" valign="middle">65.36 (&#x2212;)</td>
<td align="center" valign="middle">64.12 (&#x2212;)</td>
<td align="center" valign="middle">59.32 (&#x2212;)</td>
<td align="center" valign="middle">63.87 (&#x2212;)</td>
<td align="center" valign="middle"><bold>68.98</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Leukemia 1</td>
<td align="center" valign="middle">78.74 (&#x2212;)</td>
<td align="center" valign="middle">80.47 (&#x2212;)</td>
<td align="center" valign="middle">81.27 (&#x2212;)</td>
<td align="center" valign="middle">86.08 (&#x2212;)</td>
<td align="center" valign="middle">86.12 (&#x2212;)</td>
<td align="center" valign="middle"><bold>87.86</bold></td>
</tr>
<tr>
<td align="left" valign="middle">DLBCL</td>
<td align="center" valign="middle">82.79 (&#x2212;)</td>
<td align="center" valign="middle">83.72 (&#x2212;)</td>
<td align="center" valign="middle">83.92 (&#x2212;)</td>
<td align="center" valign="middle">85.17 (&#x2212;)</td>
<td align="center" valign="middle">87.67 (&#x2212;)</td>
<td align="center" valign="middle"><bold>89.78</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Prostate6033</td>
<td align="center" valign="middle">82.11 (&#x2212;)</td>
<td align="center" valign="middle">84.07 (&#x2212;)</td>
<td align="center" valign="middle">83.68 (&#x2212;)</td>
<td align="center" valign="middle">80.57 (&#x2212;)</td>
<td align="center" valign="middle">84.07 (&#x2212;)</td>
<td align="center" valign="middle"><bold>86.66</bold></td>
</tr>
<tr>
<td align="left" valign="middle">ALLAML</td>
<td align="center" valign="middle">78.06 (&#x2212;)</td>
<td align="center" valign="middle">79.44 (&#x2212;)</td>
<td align="center" valign="middle">82.02 (&#x2212;)</td>
<td align="center" valign="middle">89.9 (&#x2212;)</td>
<td align="center" valign="middle">91.16 (&#x2212;)</td>
<td align="center" valign="middle"><bold>94.1</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Nci9</td>
<td align="center" valign="middle">41.3 (&#x2212;)</td>
<td align="center" valign="middle">47.32 (&#x2212;)</td>
<td align="center" valign="middle">43.34 (&#x2212;)</td>
<td align="center" valign="middle">51.11 (=)</td>
<td align="center" valign="middle">51.21 (=)</td>
<td align="center" valign="middle"><bold>51.15</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Orlraws10P</td>
<td align="center" valign="middle">78.32 (&#x2212;)</td>
<td align="center" valign="middle">90.84 (&#x2212;)</td>
<td align="center" valign="middle">92.09 (&#x2212;)</td>
<td align="center" valign="middle">93.37 (&#x2212;)</td>
<td align="center" valign="middle">93.18 (&#x2212;)</td>
<td align="center" valign="middle"><bold>98.2</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Prostate</td>
<td align="center" valign="middle">84.34 (&#x2212;)</td>
<td align="center" valign="middle">82.65 (&#x2212;)</td>
<td align="center" valign="middle"><bold>88.36 (=)</bold></td>
<td align="center" valign="middle">81.68 (&#x2212;)</td>
<td align="center" valign="middle">84.17 (&#x2212;)</td>
<td align="center" valign="middle">88.38</td>
</tr>
<tr>
<td align="left" valign="middle">Leukemia 2</td>
<td align="center" valign="middle">87.68 (&#x2212;)</td>
<td align="center" valign="middle">87.15 (&#x2212;)</td>
<td align="center" valign="middle">85.46 (&#x2212;)</td>
<td align="center" valign="middle">87.16 (&#x2212;)</td>
<td align="center" valign="middle">86.45 (&#x2212;)</td>
<td align="center" valign="middle"><bold>88.12</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Lung cancer</td>
<td align="center" valign="middle">77.65 (&#x2212;)</td>
<td align="center" valign="middle">78.41 (&#x2212;)</td>
<td align="center" valign="middle">78.47 (&#x2212;)</td>
<td align="center" valign="middle">83.47 (&#x2212;)</td>
<td align="center" valign="middle">84.75 (&#x2212;)</td>
<td align="center" valign="middle"><bold>87.22</bold></td>
</tr>
<tr>
<td align="left" valign="middle">+/&#x2212;/=</td>
<td align="center" valign="middle">0/13/0</td>
<td align="center" valign="middle">0/12/1</td>
<td align="center" valign="middle">1/11/1</td>
<td align="center" valign="middle">0/10/3</td>
<td align="center" valign="middle">0/10/3</td>
<td/>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Best results are highlighted in bold.</p>
</table-wrap-foot>
</table-wrap>
<p>Compared with FULL: DMLC-MTO consistently outperforms the baseline classifier without feature selection (FULL) on all 13 datasets, highlighting the necessity and effectiveness of feature selection. For example, on the NCI9 dataset, DMLC-MTO achieves an accuracy of 68.98%, improving upon FULL&#x2019;s 66.46% by 3.8%. On the high-dimensional Prostate6033 dataset, DMLC-MTO reaches 86.66%, surpassing FULL&#x2019;s 82.11% by 5.54%. These improvements suggest that assigning discriminative weights to features effectively mitigates the curse of dimensionality and enhances classification performance.</p>
<p>Compared with PSO: DMLC-MTO significantly outperforms standard PSO on 12 out of 13 datasets, with the only tie occurring on the SRBCT dataset (95.3% vs. 95.27%). On the Lymphoma dataset, DMLC-MTO achieves 99.22%, markedly higher than PSO&#x2019;s 81.35%, a relative improvement of 21.97%. Similarly, it reaches 98.2% on the Orlraws10P dataset, outperforming PSO&#x2019;s 90.84% by 7.5%.</p>
<p>Compared with CSO-FS: DMLC-MTO exhibits clear advantages over CSO-FS, achieving better performance on 11 out of 16 datasets, with only one dataset where it performs slightly worse and the rest showing comparable results. On average, DMLC-MTO improves classification accuracy by 11.55 percentage points over CSO-FS. This gain underscores the effectiveness of the multitask framework and the embedded elite-driven competition mechanism in improving feature selection.</p>
<p>Compared with PSO-EMT: DMLC-MTO outperforms PSO-EMT on 10 out of 13 datasets, with equivalent performance on NCI9, Prostate6033, and one additional dataset. For example, it achieves 99.22% accuracy on Lymphoma, exceeding PSO-EMT&#x2019;s 93.26% by 6.4%, and obtains 89.78% on DLBCL, outperforming PSO-EMT&#x2019;s 85.17% by 5.4%. These improvements are largely attributed to the hierarchical elite learning strategy, which dynamically guides the search towards more informative feature subsets.</p>
<p>Compared with MT-PSO: DMLC-MTO achieves superior accuracy on 10 out of 13 datasets compared to MT-PSO, with tied performance on NCI9, Prostate6033, and one other dataset. On the ALLAML dataset, DMLC-MTO reaches 94.1%, improving upon MT-PSO&#x2019;s 91.16% by 3.2%. On Lung Cancer, it records 87.22% versus 84.75% by MT-PSO, a relative gain of 2.9%. These results validate the advantage of DMLC-MTO&#x2019;s multi-indicator-based task generation strategy, which constructs complementary tasks more effectively than MT-PSO&#x2019;s random task allocation approach.</p>
</sec>
<sec id="sec16">
<label>4.2.2</label>
<title>Analysis of selected feature subsets</title>
<p><xref ref-type="table" rid="tab4">Table 4</xref> reports the number of features selected by different algorithms across all datasets. Reducing the number of selected features often leads to simpler models and improved computational efficiency. The experimental results show that DMLC-MTO consistently selects fewer features than other methods. Among 65 comparisons, it outperforms its competitors in 59 cases, ties in 4, and underperforms in only 3, demonstrating its strong capability in identifying compact and informative feature subsets.</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Number of features selected by different algorithms on multiple datasets.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Dataset</th>
<th align="center" valign="top">FULL</th>
<th align="center" valign="top">PSO</th>
<th align="center" valign="top">CSO-FS</th>
<th align="center" valign="top">PSO-EMT</th>
<th align="center" valign="top">MT-PSO</th>
<th align="center" valign="top">DMLC-MTO</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">SRCBT</td>
<td align="center" valign="middle">2,308</td>
<td align="center" valign="middle">295.25 (&#x2212;)</td>
<td align="center" valign="middle">150.2 (&#x2212;)</td>
<td align="center" valign="middle">122.4 (&#x2212;)</td>
<td align="center" valign="middle">452.6 (&#x2212;)</td>
<td align="center" valign="middle"><bold>47.18</bold></td>
</tr>
<tr>
<td align="left" valign="middle">warpPIE10P</td>
<td align="center" valign="middle">2,420</td>
<td align="center" valign="middle">1185.5 (&#x2212;)</td>
<td align="center" valign="middle"><bold>8.5 (+)</bold></td>
<td align="center" valign="middle">155.67 (&#x2212;)</td>
<td align="center" valign="middle">288.6 (&#x2212;)</td>
<td align="center" valign="middle">32.52</td>
</tr>
<tr>
<td align="left" valign="middle">Lymphoma</td>
<td align="center" valign="middle">4,026</td>
<td align="center" valign="middle">2155.1 (&#x2212;)</td>
<td align="center" valign="middle"><bold>3.5 (+)</bold></td>
<td align="center" valign="middle">12.52 (+)</td>
<td align="center" valign="middle">21.99 (&#x2212;)</td>
<td align="center" valign="middle">56.39</td>
</tr>
<tr>
<td align="left" valign="middle">Nci</td>
<td align="center" valign="middle">5,244</td>
<td align="center" valign="middle">2064.8 (&#x2212;)</td>
<td align="center" valign="middle">412.8 (&#x2212;)</td>
<td align="center" valign="middle">316.74 (&#x2212;)</td>
<td align="center" valign="middle">1203.47 (&#x2212;)</td>
<td align="center" valign="middle"><bold>282.12</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Leukemia 1</td>
<td align="center" valign="middle">5,327</td>
<td align="center" valign="middle">2953.4 (&#x2212;)</td>
<td align="center" valign="middle">435.2 (&#x2212;)</td>
<td align="center" valign="middle">282.5 (&#x2212;)</td>
<td align="center" valign="middle">842.56 (&#x2212;)</td>
<td align="center" valign="middle"><bold>230.22</bold></td>
</tr>
<tr>
<td align="left" valign="middle">DLBCL</td>
<td align="center" valign="middle">5,469</td>
<td align="center" valign="middle">2154.7 (&#x2212;)</td>
<td align="center" valign="middle">332.25 (&#x2212;)</td>
<td align="center" valign="middle">194.4 (=)</td>
<td align="center" valign="middle">1025.27 (&#x2212;)</td>
<td align="center" valign="middle">200.22</td>
</tr>
<tr>
<td align="left" valign="middle">Prostate6033</td>
<td align="center" valign="middle">6,033</td>
<td align="center" valign="middle">3158.4 (&#x2212;)</td>
<td align="center" valign="middle">780.54 (&#x2212;)</td>
<td align="center" valign="middle">462.36 (&#x2212;)</td>
<td align="center" valign="middle">1451.12 (&#x2212;)</td>
<td align="center" valign="middle"><bold>113.82</bold></td>
</tr>
<tr>
<td align="left" valign="middle">ALLAML</td>
<td align="center" valign="middle">7,129</td>
<td align="center" valign="middle">3834.1 (&#x2212;)</td>
<td align="center" valign="middle">392.5 (&#x2212;)</td>
<td align="center" valign="middle">162.82 (&#x2212;)</td>
<td align="center" valign="middle">1852.22 (&#x2212;)</td>
<td align="center" valign="middle"><bold>79.93</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Nci9</td>
<td align="center" valign="middle">9,712</td>
<td align="center" valign="middle">4426.1 (&#x2212;)</td>
<td align="center" valign="middle">618.4 (+)</td>
<td align="center" valign="middle">1932.7 (=)</td>
<td align="center" valign="middle">613.28 (+)</td>
<td align="center" valign="middle">1947.22</td>
</tr>
<tr>
<td align="left" valign="middle">Orlraws10P</td>
<td align="center" valign="middle">10,304</td>
<td align="center" valign="middle">4834.9 (&#x2212;)</td>
<td align="center" valign="middle">65.4 (=)</td>
<td align="center" valign="middle">932.86 (&#x2212;)</td>
<td align="center" valign="middle">1208.04 (&#x2212;)</td>
<td align="center" valign="middle"><bold>63.28</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Prostate</td>
<td align="center" valign="middle">10,509</td>
<td align="center" valign="middle">5675.5 (&#x2212;)</td>
<td align="center" valign="middle">1305.4 (&#x2212;)</td>
<td align="center" valign="middle">185.12 (&#x2212;)</td>
<td align="center" valign="middle">2759.71 (&#x2212;)</td>
<td align="center" valign="middle"><bold>231.32</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Leukemia 2</td>
<td align="center" valign="middle">11,225</td>
<td align="center" valign="middle">3548.1 (&#x2212;)</td>
<td align="center" valign="middle">1057.6 (&#x2212;)</td>
<td align="center" valign="middle">298.3 (=)</td>
<td align="center" valign="middle">1587.2 (&#x2212;)</td>
<td align="center" valign="middle"><bold>285.58</bold></td>
</tr>
<tr>
<td align="left" valign="middle">Lung cancer</td>
<td align="center" valign="middle">12,600</td>
<td align="center" valign="middle">6923.8 (&#x2212;)</td>
<td align="center" valign="middle">1168.4 (&#x2212;)</td>
<td align="center" valign="middle">753.38 (&#x2212;)</td>
<td align="center" valign="middle">832.4 (&#x2212;)</td>
<td align="center" valign="middle"><bold>322.48</bold></td>
</tr>
<tr>
<td align="left" valign="middle">+/&#x2212;/=</td>
<td/>
<td align="center" valign="middle">0/13/0</td>
<td align="center" valign="middle">2/9/2</td>
<td align="center" valign="middle">1/11/1</td>
<td align="center" valign="middle">0/12/1</td>
<td/>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Best results are highlighted in bold.</p>
</table-wrap-foot>
</table-wrap>
<p>On high-dimensional datasets such as Orlraws10P and Lung Cancer (with over 10,000 dimensions), DMLC-MTO achieves significant dimensionality reduction while maintaining high classification accuracy. This demonstrates not only its effectiveness in compressing features, but also its ability to filter out redundant or irrelevant attributes and retain the most discriminative ones. Such compact representations are particularly beneficial in practical scenarios where computational resources are limited or real-time decision-making is required. Moreover, reducing the number of features improves model interpretability, which is critical in domains like healthcare and bioinformatics.</p>
<p>Although DMLC-MTO performs well on most datasets, there are a few cases where its classification accuracy is slightly lower than that of CSO-FS. For instance, on the Prostate dataset, DMLC-MTO selects an average of 132.13 features compared to 1305.4 selected by CSO-FS. Despite selecting far fewer features, DMLC-MTO&#x2019;s accuracy is marginally lower. This may be attributed to its limited ability to capture complex nonlinear dependencies between features when relying on filter-based metrics like Fisher Score. Furthermore, the competitive learning mechanism may occasionally introduce negative transfer, where informative features are prematurely discarded in early stages of optimization, slightly affecting final performance.</p>
<p>Nonetheless, the global search capability of DMLC-MTO ensures that it can still find effective solutions with fewer features. On datasets such as warpPIE10P and Lymphoma, where CSO-FS selects fewer features (8.5 and 3.5, respectively), it achieves only 51.54% and 55.14% accuracy. In contrast, DMLC-MTO selects slightly more features (34.57 and 86.74, respectively), yet reaches significantly higher accuracies of 99.56% and 99.36%. These results highlight the strength of DMLC-MTO&#x2019;s dual-task and elite-guided learning mechanisms in discovering high-quality feature combinations that lead to better overall performance.</p>
<p>In summary, DMLC-MTO shows great potential for high-dimensional feature selection, especially in tasks that require a minimal number of features without sacrificing classification performance. By significantly reducing dimensionality while maintaining or improving predictive accuracy, DMLC-MTO demonstrates an effective trade-off between model simplicity and discriminative power. These findings further confirm the algorithm&#x2019;s suitability for practical applications and provide a solid foundation for future research.</p>
</sec>
<sec id="sec17">
<label>4.2.3</label>
<title>Training time comparison</title>
<p><xref ref-type="fig" rid="fig6">Figure 5</xref> presents the training time comparison among all algorithms, highlighting the computational efficiency of DMLC-MTO. Benefiting from its integrated multitask mechanism and efficient search dynamics, DMLC-MTO significantly reduces redundant computations while maintaining solution quality, leading to superior runtime performance across all datasets.</p>
<fig position="float" id="fig6">
<label>Figure 5</label>
<caption>
<p>Average CPU running time.</p>
</caption>
<graphic xlink:href="frai-08-1667167-g006.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Bar chart displaying the average CPU running time across various datasets. The datasets include SRBCT, warpPIE10P, Lymphoma, Nci, Leukemia 1, DLBCL, Prostate6033, ALLAML, Nci9, orlraws10P, Prostate, Leukemia 2, and Lung Cancer. The methods compared are PSO, CSO-FS, PSO-EMT, MTPSO, and DMLC-DTO, represented by different colored bars. Time is measured in seconds on the vertical axis, ranging from zero to eight thousand nine hundred twenty-one. PSO generally shows longer running times across datasets.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec id="sec18">
<label>4.3</label>
<title>Mechanism analysis of DMLC-DTO</title>
<sec id="sec19">
<label>4.3.1</label>
<title>Evaluation of multi-criteria task generation strategy</title>
<p>To assess the effectiveness of the proposed multi-criteria task generation strategy, it is compared against three widely used feature evaluation methods: Relief-F, Pearson Correlation Coefficient (PCC), and Total Variance (TV). The comparison was conducted across 13 datasets of varying dimensionality, evaluating both the size of the selected feature subset and the resulting classification accuracy. The detailed results are presented in <xref ref-type="table" rid="tab5">Table 5</xref>.</p>
<table-wrap position="float" id="tab5">
<label>Table 5</label>
<caption>
<p>Comparison of the different task generation methods.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Dataset</th>
<th align="center" valign="top">Method</th>
<th align="center" valign="top">Subset no.</th>
<th align="center" valign="top">Accuracy</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" rowspan="4">SRBCT</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">54.4</td>
<td align="center" valign="middle">95.23</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">70.5</td>
<td align="center" valign="middle">94.58</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle">87.1</td>
<td align="center" valign="middle">88.33</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="top"><bold>47.18</bold></td>
<td align="center" valign="top"><bold>95.3</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">warpPIE10P</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">43.7</td>
<td align="center" valign="middle">98.5</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">42.3</td>
<td align="center" valign="middle">98.2</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle">70.8</td>
<td align="center" valign="middle">97.3</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="middle"><bold>32.52</bold></td>
<td align="center" valign="middle"><bold>99.13</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Lymphoma</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">97.2</td>
<td align="center" valign="middle">99.16</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">83.2</td>
<td align="center" valign="middle">98.9</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle">81.6</td>
<td align="center" valign="middle">98.5</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="middle"><bold>56.39</bold></td>
<td align="center" valign="middle"><bold>99.33</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Nci</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle"><bold>133.2</bold></td>
<td align="center" valign="middle">60.57</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">160.8</td>
<td align="center" valign="middle"><bold>70.04</bold></td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle">184</td>
<td align="center" valign="middle">66.02</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="top">282.12</td>
<td align="center" valign="top">68.98</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Leukemia 1</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">122.7</td>
<td align="center" valign="middle">87.77</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">156.8</td>
<td align="center" valign="middle">88.35</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle"><bold>120.6</bold></td>
<td align="center" valign="middle">88.11</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="top">230.22</td>
<td align="center" valign="top"><bold>87.86</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">DLBCL</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">307.8</td>
<td align="center" valign="middle">86.5</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">179.2</td>
<td align="center" valign="middle"><bold>89.83</bold></td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle">524.4</td>
<td align="center" valign="middle">85.33</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="middle"><bold>158.33</bold></td>
<td align="center" valign="middle">89.56</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Prostate6033</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">191.2</td>
<td align="center" valign="middle">86.16</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">133.5</td>
<td align="center" valign="middle">86.33</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle">251.5</td>
<td align="center" valign="middle">85.5</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="top"><bold>113.82</bold></td>
<td align="center" valign="top"><bold>86.66</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">ALLAML</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">95.4</td>
<td align="center" valign="middle">88.41</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">111.8</td>
<td align="center" valign="middle">93.16</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle">152.7</td>
<td align="center" valign="middle">91.16</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="top"><bold>79.93</bold></td>
<td align="center" valign="top"><bold>94.10</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Nci9</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">1438.2</td>
<td align="center" valign="middle">46.22</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">1194.1</td>
<td align="center" valign="middle">51.14</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle"><bold>1074.4</bold></td>
<td align="center" valign="middle"><bold>52.09</bold></td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="top">1947.22</td>
<td align="center" valign="top">51.12</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Orlraws10P</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">136.9</td>
<td align="center" valign="middle">94.2</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">305.5</td>
<td align="center" valign="middle">92.5</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle">100.8</td>
<td align="center" valign="middle">96.1</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="top"><bold>63.28</bold></td>
<td align="center" valign="top"><bold>98.2</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Prostate</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle"><bold>174.8</bold></td>
<td align="center" valign="middle">82.16</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">185.3</td>
<td align="center" valign="middle">84.5</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle">524.4</td>
<td align="center" valign="middle">85.33</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="top">231.32</td>
<td align="center" valign="top"><bold>88.38</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Leukemia 2</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">354.9</td>
<td align="center" valign="middle"><bold>91.66</bold></td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">387</td>
<td align="center" valign="middle">88.33</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle">298.3</td>
<td align="center" valign="middle">88.33</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="middle"><bold>285.58</bold></td>
<td align="center" valign="middle">88.12</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Lung cancer</td>
<td align="center" valign="middle">Relief-F</td>
<td align="center" valign="middle">222.7</td>
<td align="center" valign="middle">79.13</td>
</tr>
<tr>
<td align="center" valign="middle">PCC</td>
<td align="center" valign="middle">434.4</td>
<td align="center" valign="middle">86.08</td>
</tr>
<tr>
<td align="center" valign="middle">TV</td>
<td align="center" valign="middle"><bold>126.9</bold></td>
<td align="center" valign="middle">82.71</td>
</tr>
<tr>
<td align="center" valign="middle">Multi-criteria task generation</td>
<td align="center" valign="top">322.48</td>
<td align="center" valign="top"><bold>87.22</bold></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Best results are highlighted in bold.</p>
</table-wrap-foot>
</table-wrap>
<p>Overall, the proposed strategy demonstrates competitive or superior performance across most datasets. In terms of classification accuracy, the multi-criteria approach achieves the highest score in seven out of 13 datasets, and performs comparably in five others. For instance, on the warpPIE10P dataset, it achieves 99.13% accuracy using only 32.52 features, outperforming all baseline methods in both accuracy and feature compactness. Similarly, on Lymphoma, it reaches 99.33% accuracy while reducing the feature subset size to 56.39, significantly lower than Relief-F&#x2019;s 97.2 features.</p>
<p>In high-dimensional datasets such as Orlraws10P and DLBCL, the multi-criteria strategy also shows clear advantages. On Orlraws10P, it achieves the highest accuracy (98.2%) with the smallest feature subset (63.28), illustrating the effectiveness of combining multiple relevance indicators to filter redundant features. In DLBCL, it selects fewer features (158.33) than most methods while maintaining high accuracy (89.56%), nearly matching PCC&#x2019;s best performance (89.83%) with improved compactness.</p>
<p>It is worth noting that in some datasets like Nci9 and Leukemia 2, the proposed method selects a relatively larger number of features. In Nci9, although the feature count increases to 1947.22, the classification accuracy (51.12%) remains competitive with PCC (51.14%) and higher than Relief-F (46.22%). This suggests that, in certain cases, the adaptive thresholding mechanism may favor retaining more features to ensure sufficient representation, especially when the informative features are not well distinguished by individual metrics alone.</p>
<p>Another observation lies in the Prostate6033 and Prostate datasets, where the proposed method outperforms baseline methods in accuracy (e.g., 86.66% and 88.38%, respectively) while also maintaining relatively small feature subsets compared to TV or PCC. This highlights its capacity to balance global relevance and local refinement through dynamic integration of multiple scoring criteria.</p>
<p>In conclusion, the multi-criteria task generation strategy shows strong robustness and adaptability across various datasets. It consistently strikes a favorable trade-off between feature subset size and classification performance. By leveraging the complementary strengths of Relief-F and Fisher Score, and incorporating adaptive knee-point detection, the proposed approach enhances the reliability of feature relevance estimation and improves the initialization of auxiliary tasks in the multitask framework. These results demonstrate that the proposed task construction mechanism is an effective foundation for the DMLC-MTO algorithm.</p>
</sec>
<sec id="sec20">
<label>4.3.2</label>
<title>Elite-guided competitive particle swarm optimization</title>
<p>To further evaluate the effectiveness of the proposed knowledge transfer strategy, three variants of the algorithm is considered for comparison: (1) CSO, which relies solely on traditional pairwise competition without elite or task-level interaction; (2) EC-PSO, which introduces elite-based competition but performs optimization independently within each task; and (3) EC-PSO&#x202F;+&#x202F;knowledge transfer, which enhances EC-PSO with inter-task knowledge exchange via elite guidance. The corresponding results are visualized in <xref ref-type="fig" rid="fig7">Figures 6</xref>, <xref ref-type="fig" rid="fig8">7</xref>, where the bar charts provide an intuitive comparison of classification accuracy and the number of selected features across different methods. As shown in <xref ref-type="table" rid="tab6">Table 6</xref>, the inclusion of knowledge transfer consistently improves both classification accuracy and feature compactness across most datasets.</p>
<fig position="float" id="fig7">
<label>Figure 6</label>
<caption>
<p>Comparison of the subset number obtained by different optimization and knowledge transfer strategies.</p>
</caption>
<graphic xlink:href="frai-08-1667167-g007.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Bar chart comparing subset numbers across datasets with three methods: CSO, EC-PSO, and EC-PSO with Knowledge Transfer. Datasets include SR8CT, warPPLE10P, Lymphoma, Ncl, Leukemia 1, DLBCL, Prostate, 26033, ALLAML, Ncl9, Orlraws10P, Leukemia 2, and Lung Cancer. Notable variation occurs with Ncl9 showing the highest values for all methods, while other datasets present smaller differences.</alt-text>
</graphic>
</fig>
<fig position="float" id="fig8">
<label>Figure 7</label>
<caption>
<p>Comparison of accuracy obtained by different optimization and knowledge transfer strategies.</p>
</caption>
<graphic xlink:href="frai-08-1667167-g008.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Bar chart comparing accuracy percentages across datasets for three methods: CSO, EC-PSO, and EC-PSO with Knowledge Transfer. Accuracy is highest across SRBCT, warpPIE10P, and ALLAML datasets, with slight variations among methods. Lower performance is observed for NCI9.</alt-text>
</graphic>
</fig>
<table-wrap position="float" id="tab6">
<label>Table 6</label>
<caption>
<p>Comparison of the different optimization and knowledge transfer strategies.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Dataset</th>
<th align="center" valign="top">Method</th>
<th align="center" valign="top">Subset no.</th>
<th align="center" valign="top">Accuracy</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" rowspan="3">SRBCT</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">50.8</td>
<td align="center" valign="middle">94.16</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">62.32</td>
<td align="center" valign="middle">95.11</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle"><bold>47.18</bold></td>
<td align="center" valign="middle"><bold>95.3</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">warpPIE10P</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">37.86</td>
<td align="center" valign="middle">98.63</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">42.31</td>
<td align="center" valign="middle">97.82</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle"><bold>32.52</bold></td>
<td align="center" valign="middle"><bold>99.13</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Lymphoma</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">89.42</td>
<td align="center" valign="middle">98.11</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">72.13</td>
<td align="center" valign="middle">97.32</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle"><bold>56.39</bold></td>
<td align="center" valign="middle"><bold>99.33</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Nci</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">323.86</td>
<td align="center" valign="middle">67.13</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">352.12</td>
<td align="center" valign="middle">66.92</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle"><bold>282.12</bold></td>
<td align="center" valign="middle"><bold>68.98</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Leukemia 1</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle"><bold>212.25</bold></td>
<td align="center" valign="middle">85.23</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">301.63</td>
<td align="center" valign="middle">87.6</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle">230.22</td>
<td align="center" valign="middle"><bold>87.86</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">DLBCL</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">237.36</td>
<td align="center" valign="middle">86.46</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">322.12</td>
<td align="center" valign="middle">87.81</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle"><bold>200.22</bold></td>
<td align="center" valign="middle"><bold>89.78</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Prostate6033</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">118.76</td>
<td align="center" valign="middle">85.93</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">142.12</td>
<td align="center" valign="middle">86.2</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle"><bold>113.82</bold></td>
<td align="center" valign="middle"><bold>86.66</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">ALLAML</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">86.43</td>
<td align="center" valign="middle">91.22</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">92.11</td>
<td align="center" valign="middle">93.32</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle"><bold>79.93</bold></td>
<td align="center" valign="middle"><bold>94.10</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Nci9</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">2032.12</td>
<td align="center" valign="middle">49.24</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle"><bold>1323.11</bold></td>
<td align="center" valign="middle">46.23</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle">1947.22</td>
<td align="center" valign="middle"><bold>51.12</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Orlraws10P</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">87.2</td>
<td align="center" valign="middle">97.2</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">99.2</td>
<td align="center" valign="middle">96.2</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle"><bold>63.28</bold></td>
<td align="center" valign="middle"><bold>98.2</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Prostate</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle"><bold>206.4</bold></td>
<td align="center" valign="middle">87.96</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">261.2</td>
<td align="center" valign="middle">86.91</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle">231.32</td>
<td align="center" valign="middle"><bold>88.38</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Leukemia 2</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">300.32</td>
<td align="center" valign="middle">86.22</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">321.42</td>
<td align="center" valign="middle">85.11</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle"><bold>285.58</bold></td>
<td align="center" valign="middle"><bold>88.12</bold></td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Lung cancer</td>
<td align="center" valign="middle">CSO</td>
<td align="center" valign="middle">412.12</td>
<td align="center" valign="middle">86.54</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO</td>
<td align="center" valign="middle">362.42</td>
<td align="center" valign="middle">86.23</td>
</tr>
<tr>
<td align="center" valign="middle">EC-PSO&#x202F;+&#x202F;knowledge transfer</td>
<td align="center" valign="middle"><bold>322.48</bold></td>
<td align="center" valign="middle"><bold>87.22</bold></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Best results are highlighted in bold.</p>
</table-wrap-foot>
</table-wrap>
<p>While EC-PSO already improves upon CSO by leveraging elite-driven intra-task learning (e.g., on DLBCL and ALLAML datasets), the incorporation of cross-task knowledge sharing in EC-PSO&#x202F;+&#x202F;Knowledge Transfer brings further benefits. It achieves the best performance on nearly all datasets in terms of accuracy, while selecting fewer features in most cases. These results suggest that cross-task learning enables more effective exploration of the search space and promotes better generalization. Therefore, the proposed transfer mechanism not only enhances the performance of individual tasks but also facilitates collaboration between tasks to address the challenges of high-dimensional feature selection.</p>
</sec>
</sec>
</sec>
<sec sec-type="conclusions" id="sec21">
<label>5</label>
<title>Conclusion</title>
<p>This paper presents DMLC-MTO, a dynamic multitask evolutionary feature selection algorithm that integrates multi-indicator task generation, elite competition learning, and spatially-aware knowledge transfer. The framework effectively addresses the challenges of high-dimensional data by enabling precise evaluation of feature subsets and improving optimization efficiency through adaptive inter-task collaboration. Extensive experiments on 13 benchmark datasets demonstrate that DMLC-MTO consistently achieves superior classification accuracy with more compact feature sets compared to existing evolutionary feature selection methods. The combination of complementary filter-based indicators with competitive and transfer mechanisms guides the search toward informative and less redundant features, highlighting the framework&#x2019;s practical value in applications such as tobacco leaf grading, quality assessment, and agricultural phenotype analysis.</p>
<p>While the results validate the method&#x2019;s effectiveness, limitations remain. The reliance on filter-based indicators may not fully capture complex nonlinear feature dependencies, some hyperparameters are fixed, and evaluation has been restricted to high-dimensional gene expression and image datasets. Furthermore, qualitative interpretability of the selected features and more rigorous statistical analyses have yet to be explored. Future work will focus on addressing these limitations by incorporating adaptive hyperparameter tuning, evaluating broader and more diverse datasets, enhancing interpretability, and extending the framework to handle multi-label and unsupervised scenarios, thereby strengthening its robustness and broadening its applicability.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec22">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec sec-type="author-contributions" id="sec23">
<title>Author contributions</title>
<p>JT: Methodology, Writing &#x2013; original draft, Conceptualization, Funding acquisition, Data curation. CY: Data curation, Validation, Writing &#x2013; original draft, Conceptualization. MaL: Formal analysis, Writing &#x2013; original draft, Visualization. JG: Resources, Methodology, Investigation, Writing &#x2013; original draft. YW: Validation, Writing &#x2013; review &#x0026; editing, Software. HF: Writing &#x2013; original draft, Formal analysis, Conceptualization. MeL: Funding acquisition, Project administration, Writing &#x2013; review &#x0026; editing, Supervision. WZ: Conceptualization, Methodology, Software, Writing &#x2013; original draft. JL: Writing &#x2013; review &#x0026; editing, Resources, Supervision, Project administration.</p>
</sec>
<sec sec-type="funding-information" id="sec24">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This research was supported by the Planning Fund for Humanities and Social Sciences Research of the Ministry of Education (Grant No. 24YJAZH229), the Innovation Talent Program for Science and Technology in Higher Education of Henan Province (Grant No. 25HASTIT030) and the Science and Technology Project of China Tobacco Zhejiang Industrial Co., Ltd (Grant No. ZJZY2023D020).</p>
</sec>
<sec sec-type="COI-statement" id="sec25">
<title>Conflict of interest</title>
<p>JT, CY, JG, YW, HF, JL, and MaL were employed by China Tobacco Zhejiang Industrial Co., Ltd.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec26">
<title>Generative AI statement</title>
<p>The authors declare that no Gen AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec27">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ansari</surname><given-names>G.</given-names></name> <name><surname>Ahmad</surname><given-names>T.</given-names></name> <name><surname>Doja</surname><given-names>M. N.</given-names></name></person-group> (<year>2019</year>). <article-title>Hybrid filter&#x2013;wrapper feature selection method for sentiment classification</article-title>. <source>Arab. J. Sci. Eng.</source> <volume>44</volume>, <fpage>9191</fpage>&#x2013;<lpage>9208</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s13369-019-04064-6</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chaudhuri</surname><given-names>A.</given-names></name> <name><surname>Sahu</surname><given-names>T. P.</given-names></name></person-group> (<year>2021</year>). <article-title>A hybrid feature selection method based on binary Jaya algorithm for micro-array data classification</article-title>. <source>Comput. Electr. Eng.</source> <volume>90</volume>:<fpage>106963</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.compeleceng.2020.106963</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>J.</given-names></name> <name><surname>Li</surname><given-names>T.</given-names></name> <name><surname>Zou</surname><given-names>Y.</given-names></name> <name><surname>Wang</surname><given-names>G.</given-names></name> <name><surname>Ye</surname><given-names>H.</given-names></name> <name><surname>Lv</surname><given-names>F.</given-names></name></person-group> (<year>2019</year>). <source>An ensemble feature selection method for short-term electrical load forecasting</source>. In <conf-name>2019 IEEE 3rd Conference on Energy Internet and Energy System Integration (EI2)</conf-name>. <publisher-name>IEEE</publisher-name>, 1429&#x2013;1432.</citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>K.</given-names></name> <name><surname>Xue</surname><given-names>B.</given-names></name> <name><surname>Zhang</surname><given-names>M.</given-names></name> <name><surname>Zhou</surname><given-names>F.</given-names></name></person-group> (<year>2020</year>). <article-title>An evolutionary multitasking-based feature selection method for high-dimensional classification</article-title>. <source>IEEE Trans. Cybern.</source> <volume>52</volume>, <fpage>7172</fpage>&#x2013;<lpage>7186</lpage>.</citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>K.</given-names></name> <name><surname>Xue</surname><given-names>B.</given-names></name> <name><surname>Zhang</surname><given-names>M.</given-names></name> <name><surname>Zhou</surname><given-names>F.</given-names></name></person-group> (<year>2021</year>). <article-title>Evolutionary multitasking for feature selection in high-dimensional classification via particle swarm optimization</article-title>. <source>IEEE Trans. Evol. Comput.</source> <volume>26</volume>, <fpage>446</fpage>&#x2013;<lpage>460</lpage>.</citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dakic</surname><given-names>P.</given-names></name> <name><surname>Zivkovic</surname><given-names>M.</given-names></name> <name><surname>Jovanovic</surname><given-names>L.</given-names></name> <name><surname>Bacanin</surname><given-names>N.</given-names></name> <name><surname>Antonijevic</surname><given-names>M.</given-names></name> <name><surname>Kaljevic</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Intrusion detection using metaheuristic optimization within IoT/IIoT systems and software of autonomous vehicles</article-title>. <source>Sci. Rep.</source> <volume>14</volume>:<fpage>22884</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-024-73932-5</pub-id>, PMID: <pub-id pub-id-type="pmid">39358433</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ding</surname><given-names>Y.</given-names></name> <name><surname>Zhou</surname><given-names>K.</given-names></name> <name><surname>Bi</surname><given-names>W.</given-names></name></person-group> (<year>2020</year>). <article-title>Feature selection based on hybridization of genetic algorithm and competitive swarm optimizer</article-title>. <source>Soft. Comput.</source> <volume>24</volume>, <fpage>11663</fpage>&#x2013;<lpage>11672</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00500-019-04628-6</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fern&#x00E1;ndez-Diego</surname><given-names>M.</given-names></name> <name><surname>Gonz&#x00E1;lez-Ladr&#x00F3;n-de-Guevara</surname><given-names>F.</given-names></name></person-group> (<year>2018</year>). <article-title>Application of mutual information-based sequential feature selection to ISBSG mixed data</article-title>. <source>Softw. Qual. J.</source> <volume>26</volume>, <fpage>1299</fpage>&#x2013;<lpage>1325</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11219-017-9391-5</pub-id>, PMID: <pub-id pub-id-type="pmid">41020202</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guan</surname><given-names>S. U.</given-names></name> <name><surname>Liu</surname><given-names>J.</given-names></name> <name><surname>Qi</surname><given-names>Y.</given-names></name></person-group> (<year>2004</year>). <article-title>An incremental approach to contribution-based feature selection</article-title>. <source>J. Intell. Syst.</source> <volume>13</volume>, <fpage>15</fpage>&#x2013;<lpage>42</lpage>. doi: <pub-id pub-id-type="doi">10.1515/JISYS.2004.13.1.15</pub-id>, PMID: <pub-id pub-id-type="pmid">40896160</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Hall</surname><given-names>M. A.</given-names></name></person-group> (<year>1999</year>) Correlation-based feature selection for machine learning (Doctoral dissertation, The University of Waikato)</citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huda</surname><given-names>R. K.</given-names></name> <name><surname>Banka</surname><given-names>H.</given-names></name></person-group> (<year>2019</year>). <article-title>Efficient feature selection and classification algorithm based on PSO and rough sets</article-title>. <source>Neural Comput. Appl.</source> <volume>31</volume>, <fpage>4287</fpage>&#x2013;<lpage>4303</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00521-017-3317-9</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kamalov</surname><given-names>F.</given-names></name> <name><surname>Sulieman</surname><given-names>H.</given-names></name> <name><surname>Alzaatreh</surname><given-names>A.</given-names></name> <name><surname>Emarly</surname><given-names>M.</given-names></name> <name><surname>Chamlal</surname><given-names>H.</given-names></name> <name><surname>Safaraliev</surname><given-names>M.</given-names></name></person-group> (<year>2025</year>). <article-title>Mathematical methods in feature selection: a review</article-title>. <source>Mathematics</source> <volume>13</volume>:<fpage>996</fpage>. doi: <pub-id pub-id-type="doi">10.3390/math13060996</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Kononenko</surname><given-names>I.</given-names></name></person-group> (<year>1994</year>). &#x201C;<article-title>Estimating attributes: analysis and extensions of RELIEF</article-title>&#x201D; in <source>European Conference on Machine Learning</source> (<publisher-loc>Berlin, Heidelberg</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>171</fpage>&#x2013;<lpage>182</lpage>.</citation></ref>
<ref id="ref14"><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Li</surname><given-names>X.</given-names></name> <name><surname>Li</surname><given-names>B.</given-names></name> <name><surname>Wang</surname><given-names>Y.</given-names></name></person-group> (<year>2023</year>). <source>Multiobjective fuzzy competitive swarm optimization for high-dimensional feature selection</source>. In <conf-name>2023 5th International Conference on Data-driven Optimization of Complex Systems (DOCS)</conf-name>. <publisher-loc>Tianjin, China</publisher-loc>, <publisher-name>IEEE</publisher-name>. <fpage>1</fpage>&#x2013;<lpage>6</lpage></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>L.</given-names></name> <name><surname>Xuan</surname><given-names>M.</given-names></name> <name><surname>Lin</surname><given-names>Q.</given-names></name> <name><surname>Jiang</surname><given-names>M.</given-names></name> <name><surname>Ming</surname><given-names>Z.</given-names></name> <name><surname>Tan</surname><given-names>K. C.</given-names></name></person-group> (<year>2023</year>). <article-title>An evolutionary multitasking algorithm with multiple filtering for high-dimensional feature selection</article-title>. <source>IEEE Trans. Evol. Comput.</source> <volume>27</volume>, <fpage>802</fpage>&#x2013;<lpage>816</lpage>. doi: <pub-id pub-id-type="doi">10.1109/TEVC.2023.3254155</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lohitha</surname><given-names>N. S.</given-names></name> <name><surname>Pounambal</surname><given-names>M.</given-names></name></person-group> (<year>2022</year>). <article-title>A novel hybrid spotted hyena-swarm optimization (HS-FFO) framework for effective feature selection in iot based cloud security data</article-title>. <source>Int. J. Recent Innov. Trends Comput. Commun.</source> <volume>10</volume>, <fpage>290</fpage>&#x2013;<lpage>303</lpage>. doi: <pub-id pub-id-type="doi">10.17762/ijritcc.v10i1s.5851</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mladenovic</surname><given-names>D.</given-names></name> <name><surname>Antonijevic</surname><given-names>M.</given-names></name> <name><surname>Jovanovic</surname><given-names>L.</given-names></name> <name><surname>Simic</surname><given-names>V.</given-names></name> <name><surname>Zivkovic</surname><given-names>M.</given-names></name> <name><surname>Bacanin</surname><given-names>N.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Sentiment classification for insider threat identification using metaheuristic optimized machine learning classifiers</article-title>. <source>Sci. Rep.</source>:<fpage>25731</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-024-77240-w</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pandey</surname><given-names>A. C.</given-names></name> <name><surname>Rajpoot</surname><given-names>D. S.</given-names></name> <name><surname>Saraswat</surname><given-names>M.</given-names></name></person-group> (<year>2020</year>). <article-title>Feature selection method based on hybrid data transformation and binary binomial cuckoo search</article-title>. <source>J. Ambient. Intell. Humaniz. Comput.</source> <volume>11</volume>, <fpage>719</fpage>&#x2013;<lpage>738</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s12652-019-01330-1</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Patterson</surname><given-names>G.</given-names></name> <name><surname>Zhang</surname><given-names>M.</given-names></name></person-group> (<year>2007</year>). &#x201C;<article-title>Fitness functions in genetic programming for classification with unbalanced data</article-title>&#x201D; in <source>Australasian Joint Conference on Artificial Intelligence</source>. ed. M. A. Orgun and J. Thornton (<publisher-loc>Berlin, Heidelberg</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>769</fpage>&#x2013;<lpage>775</lpage>. doi: <pub-id pub-id-type="doi">10.1007/978-3-540-76928-6_90</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Paul</surname><given-names>J.</given-names></name> <name><surname>Dupont</surname><given-names>P.</given-names></name></person-group> (<year>2015</year>). <article-title>Kernel methods for heterogeneous feature selection</article-title>. <source>Neurocomputing</source> <volume>169</volume>, <fpage>187</fpage>&#x2013;<lpage>195</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neucom.2014.12.098</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pichai</surname><given-names>S.</given-names></name> <name><surname>Sunat</surname><given-names>K.</given-names></name> <name><surname>Chiewchanwattana</surname><given-names>S.</given-names></name></person-group> (<year>2020</year>). <article-title>An asymmetric chaotic competitive swarm optimization algorithm for feature selection in high-dimensional data</article-title>. <source>Symmetry</source> <volume>12</volume>:<fpage>1782</fpage>. doi: <pub-id pub-id-type="doi">10.3390/sym12111782</pub-id>, PMID: <pub-id pub-id-type="pmid">40881048</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sadeghian</surname><given-names>Z.</given-names></name> <name><surname>Akbari</surname><given-names>E.</given-names></name> <name><surname>Nematzadeh</surname><given-names>H.</given-names></name> <name><surname>Motameni</surname><given-names>H.</given-names></name></person-group> (<year>2025</year>). <article-title>A review of feature selection methods based on meta-heuristic algorithms</article-title>. <source>J. Exp. Theor. Artif. Intell.</source> <volume>37</volume>, <fpage>1</fpage>&#x2013;<lpage>51</lpage>. doi: <pub-id pub-id-type="doi">10.1080/0952813X.2023.2183267</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Salb</surname><given-names>M.</given-names></name> <name><surname>Jovanovic</surname><given-names>L.</given-names></name> <name><surname>Elsadai</surname><given-names>D. Z. M.</given-names></name></person-group> (<year>2024</year>). <article-title>Cloud spot instance price forecasting multi-headed models tuned using modified PSO</article-title>. <source>J. King Saud Univ. Sci.</source> <volume>36</volume>:<fpage>103473</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jksus.2024.103473</pub-id>, PMID: <pub-id pub-id-type="pmid">41016916</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Senliol</surname><given-names>B.</given-names></name> <name><surname>Gulgezen</surname><given-names>G.</given-names></name> <name><surname>Yu</surname><given-names>L.</given-names></name> <name><surname>Cataltepe</surname><given-names>Z.</given-names></name></person-group> (<year>2008</year>). <source>Fast Correlation Based Filter (FCBF) with a different search strategy</source>. In <conf-name>2008 23rd International Symposium on Computer and Information Sciences</conf-name>. <publisher-name>IEEE</publisher-name>, <fpage>1</fpage>&#x2013;<lpage>4</lpage></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Solorio</surname><given-names>F. S.</given-names></name> <name><surname>Carrasco-Ochoa</surname><given-names>J. A.</given-names></name> <name><surname>Mart&#x00ED;nez-Trinidad</surname><given-names>J. F.</given-names></name></person-group> (<year>2024</year>). <article-title>Filter unsupervised spectral feature selection method for mixed data based on a new feature correlation measure</article-title>. <source>Neurocomputing</source> <volume>571</volume>:<fpage>127111</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neucom.2023.127111</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Solorio</surname><given-names>F. S.</given-names></name> <name><surname>Mart&#x00ED;nez</surname><given-names>T. J. F.</given-names></name> <name><surname>Carrasco-Ochoa</surname><given-names>J. A.</given-names></name></person-group> (<year>2020</year>). <article-title>A supervised filter feature selection method for mixed data based on spectral feature selection and information-theory redundancy analysis</article-title>. <source>Pattern Recogn. Lett.</source> <volume>138</volume>, <fpage>321</fpage>&#x2013;<lpage>328</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.patrec.2020.07.039</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Song</surname><given-names>X. F.</given-names></name> <name><surname>Zhang</surname><given-names>Y.</given-names></name> <name><surname>Gong</surname><given-names>D. W.</given-names></name> <name><surname>Gao</surname><given-names>X. Z.</given-names></name></person-group> (<year>2021</year>). <article-title>A fast hybrid feature selection based on correlation-guided clustering and particle swarm optimization for high-dimensional data</article-title>. <source>IEEE Trans. Cybern.</source> <volume>52</volume>, <fpage>9573</fpage>&#x2013;<lpage>9586</lpage>.</citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Swesi</surname><given-names>I. M. A. O.</given-names></name> <name><surname>Bakar</surname><given-names>A. A.</given-names></name></person-group> (<year>2019</year>). <article-title>Feature clustering for PSO-based feature construction on high-dimensional data</article-title>. <source>J. Inf. Commun. Technol.</source> <volume>18</volume>, <fpage>439</fpage>&#x2013;<lpage>472</lpage>.</citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname><given-names>W.</given-names></name> <name><surname>Mao</surname><given-names>K. Z.</given-names></name></person-group> (<year>2007</year>). <article-title>Feature selection algorithm for mixed data with both nominal and continuous features</article-title>. <source>Pattern Recogn. Lett.</source> <volume>28</volume>, <fpage>563</fpage>&#x2013;<lpage>571</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.patrec.2006.10.008</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tian</surname><given-names>Y.</given-names></name> <name><surname>Zheng</surname><given-names>X.</given-names></name> <name><surname>Zhang</surname><given-names>X.</given-names></name> <name><surname>Jin</surname><given-names>Y.</given-names></name></person-group> (<year>2019</year>). <article-title>Efficient large-scale multiobjective optimization based on a competitive swarm optimizer</article-title>. <source>IEEE Trans Cybern</source> <volume>50</volume>, <fpage>3696</fpage>&#x2013;<lpage>3708</lpage>. doi: <pub-id pub-id-type="doi">10.1109/TCYB.2019.2906383</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Too</surname><given-names>J.</given-names></name> <name><surname>Abdullah</surname><given-names>A. R.</given-names></name> <name><surname>Mohd Saad</surname><given-names>N.</given-names></name></person-group> (<year>2019</year>). <article-title>Binary competitive swarm optimizer approaches for feature selection</article-title>. <source>Computation</source> <volume>7</volume>:<fpage>31</fpage>. doi: <pub-id pub-id-type="doi">10.3390/computation7020031</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tran</surname><given-names>B.</given-names></name> <name><surname>Xue</surname><given-names>B.</given-names></name> <name><surname>Zhang</surname><given-names>M.</given-names></name></person-group> (<year>2018</year>). <article-title>Variable-length particle swarm optimization for feature selection on high-dimensional classification</article-title>. <source>IEEE Trans. Evol. Comput.</source> <volume>23</volume>, <fpage>473</fpage>&#x2013;<lpage>487</lpage>.</citation></ref>
<ref id="ref33"><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Tran</surname><given-names>B.</given-names></name> <name><surname>Xue</surname><given-names>B.</given-names></name> <name><surname>Zhang</surname><given-names>M.</given-names></name></person-group> (<year>2019</year>), <source>Adaptive multi-subswarm optimisation for feature selection on high-dimensional classification</source>. <conf-name>GECCO '19: Proceedings of the Genetic and Evolutionary Computation Conference</conf-name>. <fpage>481</fpage>&#x2013;<lpage>489</lpage></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vergara</surname><given-names>J. R.</given-names></name> <name><surname>Est&#x00E9;vez</surname><given-names>P. A.</given-names></name></person-group> (<year>2014</year>). <article-title>A review of feature selection methods based on mutual information</article-title>. <source>Neural Comput. Appl.</source> <volume>24</volume>, <fpage>175</fpage>&#x2013;<lpage>186</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00521-013-1368-0</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Villoth</surname><given-names>J. P.</given-names></name> <name><surname>Zivkovic</surname><given-names>M.</given-names></name> <name><surname>Zivkovic</surname><given-names>T.</given-names></name> <name><surname>Abdel-salam</surname><given-names>M.</given-names></name> <name><surname>Hammad</surname><given-names>M.</given-names></name> <name><surname>Jovanovic</surname><given-names>L.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Two-tier deep and machine learning approach optimized by adaptive multi-population firefly algorithm for software defects prediction</article-title>. <source>Neurocomputing</source> <volume>630</volume>:<fpage>129695</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neucom.2025.129695</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Yan</surname><given-names>X.</given-names></name> <name><surname>Sarkar</surname><given-names>M.</given-names></name> <name><surname>Gebru</surname><given-names>B.</given-names></name> <name><surname>Nazmi</surname><given-names>S.</given-names></name> <name><surname>Homaifar</surname><given-names>A.</given-names></name></person-group> (<year>2021</year>). <source>A supervised feature selection method for mixed-type data using density-based feature clustering</source>. In <conf-name>2021 IEEE International Conference on Systems, Man, and Cybernetics (SMC)</conf-name>. <publisher-name>IEEE</publisher-name>, <fpage>1900</fpage>&#x2013;<lpage>1905</lpage>.</citation></ref>
</ref-list>
</back>
</article>