<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2025.1740598</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Dualistic MADS-box evolution forged legume diversity post-WGD</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Nan</surname><given-names>Haiyang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Chen</surname><given-names>Xinxin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname><given-names>Jiajia</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Zou</surname><given-names>Mingyang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Shang</surname><given-names>Erxuan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Guo</surname><given-names>Xinyi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Kou</surname><given-names>Kun</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3269876/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Engineering Research Center of Agricultural Microbiology Technology, Ministry of Education &amp; Heilongjiang Provincial Key Laboratory of Plant Genetic Engineering and Biological Fermentation Engineering for Cold Region &amp; Key Laboratory of Molecular Biology, College of Heilongjiang Province &amp; School of Life Sciences, Heilongjiang University</institution>, <city>Harbin</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>College of Information Engineering, East University of Heilongjiang</institution>, <city>Harbin</city>,&#xa0;<country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Kun Kou, <email xlink:href="mailto:koukun@hlju.edu.cn">koukun@hlju.edu.cn</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-01-15">
<day>15</day>
<month>01</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1740598</elocation-id>
<history>
<date date-type="received">
<day>06</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>03</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>29</day>
<month>11</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Nan, Chen, Zhang, Zou, Shang, Guo and Kou.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Nan, Chen, Zhang, Zou, Shang, Guo and Kou</copyright-holder>
<license>
<ali:license_ref start_date="2026-01-15">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>The MADS-box gene family plays a central role in plant development and adaptation, yet its evolutionary history in legumes is remarkably complex. In this study, we performed a pangenomic analysis across 52 legume species, identifying 4,872 MADS-box genes and reconstructing their phylogeny into 16 subfamilies. Our analysis uncovered a pervasive dualistic evolutionary model driven by distinct duplication mechanisms. Structurally, the genes fall into two categories: the compact, intron-poor Type I and the complex, intron-rich Type II. We demonstrate that whole-genome duplication (WGD) serves as the major driver (42.2%) behind the expansion of the conserved core genome, which includes key floral regulators such as the &#x201c;ABCDE model&#x201d; genes. These WGD-derived genes are under strong purifying selection, thereby ensuring developmental stability. In contrast, small-scale duplication (SSD) fuels the expansion of the dynamic periphery, primarily composed of Type I genes and stress-responsive clades, which evolve under relaxed selection and promote lineage-specific innovation&#x2014;as strikingly exemplified by the massive tandem expansion of the SVP subfamily in Prosopis. Pangenome analysis confirmed that WGD-derived genes were enriched in the conserved core genome, underpinning essential functions, whereas SSD-derived genes dominated the variable genome and acted as a source of genetic novelty. Transcriptome analysis in soybean identified four organ-specific expression modules, predominantly comprising Type II core genes. Under biotic and abiotic stress, WGD-derived gene pairs exhibited prominent asymmetric expression. The expression divergence was validated by qRT-PCR. Overall, our findings establish a unified framework for MADS-box gene evolution in legumes, illustrating how divergent duplication mechanisms and selective pressures have collectively shaped a gene family critical to both evolutionary innovation and developmental stability.</p>
</abstract>
<kwd-group>
<kwd>asymmetric expression</kwd>
<kwd>legume</kwd>
<kwd>MADS-box</kwd>
<kwd>SSD</kwd>
<kwd>WGD</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This work was supported by Natural Science Foundation of Heilongjiang Province (LH2024C092) and Basic Scientific Research Business Fund of Colleges and Universities of Heilongjiang Province (2023-KYYWF-1491).</funding-statement>
</funding-group>
<counts>
<fig-count count="10"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="79"/>
<page-count count="19"/>
<word-count count="8102"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Functional and Applied Plant Genomics</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Whole-genome duplication (WGD), a form of macro-mutation, is a primary engine of evolution in eukaryotes, and it is so pervasive in plants that all extant angiosperms are considered to be paleopolyploids (<xref ref-type="bibr" rid="B12">Clark and Donoghue, 2018</xref>; <xref ref-type="bibr" rid="B62">Soltis et&#xa0;al., 2015</xref>). This explosive, genome-wide event stands in stark contrast to the continuous, localized &#x201c;micro-mutations&#x201d; of small-scale duplications (SSDs)&#x2014;a collection of processes including tandem, proximal, dispersed, and transposed duplications&#x2014;which typically add genes one at a time (<xref ref-type="bibr" rid="B22">Freeling, 2009</xref>; <xref ref-type="bibr" rid="B45">Mascagni, et&#xa0;al., 2021</xref>). While SSDs provide a steady, manageable stream of raw material, WGD is not a simple doubling of gene content but rather the start of a dynamic WGD-fractionation cycle, in which most duplicated genes are eventually lost over millions of years (<xref ref-type="bibr" rid="B29">Hong et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B62">Soltis et&#xa0;al., 2015</xref>). Indeed, without extensive fractionation, some plant genomes would be ten times their current size (<xref ref-type="bibr" rid="B14">Comai, 2005</xref>). The surviving gene duplicates, however, provide vast raw material for innovation through neofunctionalization or subfunctionalization (<xref ref-type="bibr" rid="B27">Guo et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B36">Konrad et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B70">Xue and Fu, 2009</xref>). Yet, WGD imposes a severe genomic shock, often leading to reduced fertility and instability, making most polyploidization events short-lived evolutionary dead-ends (<xref ref-type="bibr" rid="B60">Shimizu, 2022</xref>). For those that persist, a fundamental challenge arises: how to manage massive gene redundancy while maintaining the integrity of complex regulatory networks. The &#x201c;gene dosage balance hypothesis&#x201d; posits that genes encoding components of stoichiometric complexes, such as transcription factor networks, are particularly sensitive to such disruption, creating a strong selective pressure to preserve their relative quantities (<xref ref-type="bibr" rid="B7">Birchler and Veitia, 2010</xref>, <xref ref-type="bibr" rid="B8">2014</xref>; <xref ref-type="bibr" rid="B15">Conant et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B39">Liang and Fernandez, 2008</xref>; <xref ref-type="bibr" rid="B59">Shi et&#xa0;al., 2020</xref>). This establishes a fundamental tension for any post-polyploid lineage: how to resolve the conflict between the immense creative potential of gene duplication and the stringent homeostatic constraints required for survival?</p>
<p>The Fabaceae (legume) family represents a spectacular evolutionary success, ranking as the third-largest angiosperm family with nearly 20,000 species and dominating ecosystems worldwide (<xref ref-type="bibr" rid="B72">Yu et&#xa0;al., 2025</xref>; <xref ref-type="bibr" rid="B78">Zhao et&#xa0;al., 2021a</xref>). Its rapid diversification is intimately linked to a complex history of polyploidy, highlighted by a major WGD event shared among the Papilionoideae subfamily occurring approximately 59 million years ago (Mya), shortly after the Cretaceous-Paleogene (K-Pg) mass extinction (~66 Mya) (<xref ref-type="bibr" rid="B35">Koenen et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B66">Vanneste et&#xa0;al., 2014</xref>). This timing suggests a compelling hypothesis: the genomic plasticity conferred by WGD provided a critical adaptive advantage, enabling ancestral legumes to colonize the numerous ecological niches left vacant by the extinction event. This scenario raises a fundamental question: What were the specific genomic features that allowed the ancestral legume to harness the genetic instability of WGD, leading not to extinction but to an explosion of diversity and key innovations?</p>
<p>A key to this success lies in the evolutionary dynamics of master regulatory gene families, chief among them the MADS-box family. Named after its founding members from fungi (<italic>MCM1</italic>), plants (<italic>AGAMOUS</italic>, <italic>DEFICIENS</italic>), and animals (<italic>SRF</italic>), this ancient transcription factor lineage orchestrates nearly all major developmental transitions in plants (<xref ref-type="bibr" rid="B25">Goyal et&#xa0;al., 2023</xref>). Their function relies on the assembly of multiprotein complexes that bind to specific CArG-box DNA motifs (CC(A/T)6GG) in target genes (<xref ref-type="bibr" rid="B1">Airoldi and Davies, 2012</xref>; <xref ref-type="bibr" rid="B46">Melzer and Theissen, 2009</xref>; <xref ref-type="bibr" rid="B57">Shen et&#xa0;al., 2021</xref>). This mechanism is famously exemplified by the &#x201c;floral quartet model&#x201d;, which provides the molecular basis for the &#x201c;ABCDE model&#x201d; of flower development (<xref ref-type="bibr" rid="B2">Ali et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B41">Liu et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B46">Melzer and Theissen, 2009</xref>). Critically, the plant MADS-box family is partitioned into two ancient lineages with distinct structures (<xref ref-type="bibr" rid="B5">Bartlett, 2017</xref>; <xref ref-type="bibr" rid="B49">Ng and Yanofsky, 2001</xref>). The Type II (MIKC) genes possess a characteristic four-domain structure: a MADS (M) domain for DNA binding, an Intervening (I) domain for dimerization specificity, a C-terminal (C) domain for transcriptional activation, and a Keratin-like (K) domain (<xref ref-type="bibr" rid="B30">Hu et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B64">Thangavel and Nayar, 2018</xref>; <xref ref-type="bibr" rid="B75">Zhao et&#xa0;al., 2021a</xref>). The evolution of this K domain, which acts as a scaffold for forming higher-order complexes, was a milestone that enabled the combinatorial control necessary for complex morphologies (<xref ref-type="bibr" rid="B3">Ambrose et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B44">Manzoor et&#xa0;al., 2024</xref>). In contrast, the structurally simpler and less-studied Type I genes generally lack this K domain and play critical but enigmatic roles in reproduction, particularly in gametophyte and endosperm development (<xref ref-type="bibr" rid="B13">Colombo et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B16">De Bodt et&#xa0;al., 2003</xref>; <xref ref-type="bibr" rid="B48">Nam et&#xa0;al., 2004</xref>).</p>
<p>The ancient structural dichotomy between Type I and Type II MADS-box genes provided a critical genomic template for the legume-specific WGD. We hypothesized that this WGD event acted as a powerful selective filter on these pre-existing lineages. Specifically, we posited that WGD preferentially preserved the complex, dosage-sensitive Type II core to maintain stability, while SSD fueled the expansion of the streamlined Type I periphery to drive innovation. In this study, we undertook a large-scale phylogenomic investigation of 4,872 MADS-box genes across 52 Fabaceae species to reconstruct their duplication histories and trace their evolutionary trajectories. By integrating this deep evolutionary framework with functional insights from expression analyses in <italic>Glycine max</italic>, this study aims to dissect the contrasting roles of WGD versus SSD in shaping this pivotal gene family.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Genome data acquisition and species tree reconstruction</title>
<p>We retrieved the genome assemblies and protein annotations for 52 Fabaceae species from multiple public databases, including NCBI, plantGIR (<xref ref-type="bibr" rid="B40">Liu et&#xa0;al., 2024</xref>) and LGRPv2 (<xref ref-type="bibr" rid="B72">Yu et&#xa0;al., 2025</xref>). Detailed information was provided in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>. To establish a robust species evolutionary framework, a consensus topology (branching structure) was obtained from the TimeTree 5 web server (<xref ref-type="bibr" rid="B38">Kumar et&#xa0;al., 2022</xref>) and LGRPv2 (<xref ref-type="bibr" rid="B72">Yu et&#xa0;al., 2025</xref>). Documented WGD and whole genome triplications (WGT) events were manually annotated onto the species tree based on published literature (<xref ref-type="bibr" rid="B32">Jiao et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B72">Yu et&#xa0;al., 2025</xref>; <xref ref-type="bibr" rid="B74">Zhang et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B78">Zhao et&#xa0;al., 2021b</xref>).</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Identification of MADS-box gene family in Fabaceae</title>
<p>The HMM profile of the conserved SRF-TF domain (PF00319) was used to search against the proteomes of all 52 Fabaceae species. To provide a broader evolutionary context, we also searched the proteomes of selected outgroup species: <italic>Polygala tenuifolia</italic>, <italic>Vitis vinifera</italic>, <italic>Amborella trichopoda</italic>, <italic>Nymphaea colorata</italic>, <italic>Arabidopsis thaliana</italic>, and <italic>Oryza sativa</italic> (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>). All searches were conducted using HMMER (v3.4) with a cutoff E-value cutoff of 1&#xd7;10<sup>-5</sup> (<xref ref-type="bibr" rid="B51">Potter et&#xa0;al., 2018</xref>). To ensure high accuracy, all candidate sequences were manually curated. Sequences shorter than 100 amino acids were removed, and the presence of the MADS domain in the remaining candidates was verified using the NCBI Conserved Domain Database (NCBI-CDD) web server.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Phylogenetic analysis and subfamily classification</title>
<p>To elucidate the evolutionary relationships within the MADS-box family, we performed a multi-step phylogenetic analysis. The full-length amino acid sequences of all identified MADS-box proteins were aligned using MAFFT (v7.505) (<xref ref-type="bibr" rid="B33">Katoh and Standley, 2013</xref>) and then trimmed to remove poorly aligned regions using trimAl (v1.4) (<xref ref-type="bibr" rid="B10">Capella-Guti&#xe9;rrez et&#xa0;al., 2009</xref>). A maximum likelihood (ML) phylogenetic tree was constructed from the trimmed alignment using FastTree (v2.1.11) with the JTT (Jones-Taylor-Thornton) protein substitution model. Local branch support was assessed using the Shimodaira-Hasegawa-like (SH-like) method, based on 1,000 resamples, as implemented in FastTree (<xref ref-type="bibr" rid="B52">Price et&#xa0;al., 2009</xref>). Based on the topology of the phylogenetic tree and established domain architectures from foundational studies (<xref ref-type="bibr" rid="B34">Kaufmann et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B50">Parenicov&#xe1; et&#xa0;al., 2003</xref>). Tree visualization was done with Evolview (<xref ref-type="bibr" rid="B63">Subramanian et&#xa0;al., 2019</xref>).</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Gene structure and motif analysis</title>
<p>Gene structure statistics, including gene length, amino acid length, intron length, intron/exon number were retrieved from genomic annotation GFF3 files for each species. To investigate the conservation and divergence of protein architecture, we analyzed the conserved motifs within each MADS-box subfamily using the MEME suite (v5.5.8) (<xref ref-type="bibr" rid="B4">Bailey et&#xa0;al., 2015</xref>). The analysis was set to identify a maximum of 5 motifs and only those that appear in over 50% of all sequences were selected for visualization.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Analysis of duplication events and selection pressure</title>
<p>The protein sequences were aligned using Diamond v2.0.5.143 in blastp mode with a E-value cutoff 0.001 and max-target-seqs 5 (<xref ref-type="bibr" rid="B9">Buchfink et&#xa0;al., 2021</xref>). Synteny analysis was conducted for each species using MCScanX with the following parameters: a minimum of colinear genes were required to define a block (-s 5), and the maximum gene gap allowed between collinear genes was set to (-m 25) (<xref ref-type="bibr" rid="B67">Wang et&#xa0;al., 2012</xref>). Based on the synteny information and genomic locations, duplicated gene pairs were classified into five types: WGD, tandem, proximal, dispersed, and transposed, using the DupGen-finder (v1.0.0) (<xref ref-type="bibr" rid="B54">Qiao et&#xa0;al., 2019</xref>). The rates of synonymous (<italic>Ks</italic>) and non-synonymous (<italic>Ka</italic>) substitutions were calculated using KaKs_Calculator (v2.0). To mitigate the impact of noise and artifacts on evolutionary rate estimates, only gene pairs with <italic>Ks</italic> values &lt; 2 and <italic>P</italic>-Value &lt; 0.05 were included in subsequent analyses. The ratio Ka/Ks was then used to infer the selection pressure acting on these duplicated genes.</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Pangenome analysis of MADS-box subfamilies</title>
<p>To assess the conservation and dispensability of MADS-box subfamilies across the Fabaceae, we conducted a pangenome analysis. For each subfamily, protein sequences from all 52 species were clustered into orthologous groups (OGs) using CD-HIT (v4.8.1) a 40% sequence identity threshold (<xref ref-type="bibr" rid="B23">Fu et&#xa0;al., 2012</xref>). The resulting clusters were categorized into four frequency-based groups according to established pangenome nomenclature (<xref ref-type="bibr" rid="B65">Tong et&#xa0;al., 2025</xref>): (i) core (present in all 52 Fabaceae species), (ii) soft-core (present in &gt;90% of species), (iii) shell (present in 10%&#x2013;90% of species), (iv) cloud (present in &lt;10% of species).</p>
</sec>
<sec id="s2_7">
<label>2.7</label>
<title>Gene expression analysis in soybean</title>
<p>To investigate the functional divergence of MADS-box genes, particularly among duplicated pairs, we analyzed a large-scale RNA-seq dataset for soybean (<italic>Glycine max</italic>). We retrieved the expression profiles of 3,638 RNA-seq samples of soybean derived from various tissues and abiotic and biotic stresses from the soybean RNA-seq Database (<ext-link ext-link-type="uri" xlink:href="https://plantrnadb.com/soybean/">https://plantrnadb.com/soybean/</ext-link>) (<xref ref-type="bibr" rid="B73">Yu et&#xa0;al., 2022</xref>) (<xref ref-type="supplementary-material" rid="SM2"><bold>Supplementary Table S2</bold></xref>). FPKM values were extracted for all identified soybean MADS-box genes. These values were used to analyze tissue-specific expression patterns and to compare the expression divergence between duplicated gene pairs derived from WGD and SSD events.</p>
<p>To identify organ-specific expression modules, hierarchical clustering was performed using the pheatmap package in R. Prior to clustering, FPKM values were log2-transformed and standardized using <italic>z</italic>-scores to highlight expression trends rather than absolute abundance. A distance matrix was computed using the Euclidean method, and clustering was conducted using the Ward&#x2019;s minimum variance method (Ward.D2). The resulting dendrogram was cut to define four distinct expression modules.</p>
</sec>
<sec id="s2_8">
<label>2.8</label>
<title>Plant cultivation, treatments, RNA isolation, and qRT-PCR</title>
<p>To validate the expression patterns, soybean seeds were germinated on moist paper for 5 days and then transferred into a light chamber under a 16h:8h, light: dark photoperiod with 60% relative humidity at 25 &#xb0;C. The seedlings were grown in pots containing a 2:1 mixture of forest soil: vermiculite for 2 weeks. Select plants with uniform growth and divide them into four groups. For drought treatment, the seedlings roots were rinsed with water to remove adherent soil without damaging root hairs. Then excess surface water was blotted using filter papers for the induction of rapid drought for 0 (CK), 1, 3, 8 and 12 hours. For NaCl treatment, the seedlings were treated separately with 1/2 Hoagland nutrient solution, 150 mM NaCl solution and 200 mM NaCl solution on different periods (0, 1, 3, 8 and 12 hours), respectively. Leaf samples are collected into test tubes, rapidly frozen with liquid nitrogen, and subsequently used for RNA extraction. Total RNA was extracted using the Ultrapure RNA Kit (CWBIO, China), which includes TRIzon Reagent as a key component, and cDNA was synthetized with M-MLV reverse transcriptase kit (Takara). Quantitative real-time polymerase chain reaction (qRT-PCR) was performed with SYBR Premix Ex (TaKaRa) on the Roche Light Cycler 480 system (Roche, Germany) with PCR kit (Roche, Germany). The soybean endogenous gene <italic>TUBULIN</italic> (<italic>Glyma.05G157300</italic>) was used as an internal control, and the relative expression levels of examined genes were calculated using the 2<sup>-&#x394;&#x394;Ct</sup> method (<xref ref-type="bibr" rid="B42">Livak and Schmittgen, 2001</xref>). Three biological replications were performed in each test. The primers are listed in <xref ref-type="supplementary-material" rid="SM3"><bold>Supplementary Table S3</bold></xref>.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Identification and phylogenetic classification of MADS-box in Fabaceae</title>
<p>To systematically map the MADS-box gene family across the Fabaceae, we conducted genome-wide search in 52 species of legumes that represent three major subfamilies: 38 species from the Papilionoideae subfamily, 11 from the Caesalpinioideae, and 3 from the Cercidoideae (<xref ref-type="supplementary-material" rid="SM4"><bold>Supplementary Table S4</bold></xref>). A total of 4,872 high-confidence MADS-box genes were identified, comprising 2,032 Type I and 2,840 Type II (MIKC) members (<xref ref-type="supplementary-material" rid="SM4"><bold>Supplementary Table S4</bold></xref>). To elucidate the evolutionary relationships more clearly, we included several evolutionarily significant outgroup species in our analysis, encompassing, including <italic>Polygala tenuifolia</italic>, <italic>Vitis vinifera</italic>, <italic>Amborella trichopoda</italic>, <italic>Nymphaea colorata</italic>, <italic>Arabidopsis thaliana</italic>, <italic>Oryza sativa</italic>, and conducted identification for these species as well (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Tables S1</bold></xref>, <xref ref-type="supplementary-material" rid="SM4"><bold>S4</bold></xref>). The resulting phylogeny clearly partitions the family into 16 subfamilies (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>). The Type I lineage is the largest branch, comprising the M&#x3b1;, M&#x3b2;, and M&#x3b3; clades, with M&#x3b2; and M&#x3b3; showing a closer relationship. The Type II lineage consists of 13 distinct clades, with clear clustering observed among core floral development genes. Among them, AG/STK, SOC1, FLC, AGL6, SEP, and AP1/FUL are clustered together, suggesting a closer phylogenetic relationship. Additionally, the AP3/PI, BS, and AGL12 are also clustered together, indicating a closer relationship. The other clades in Type II are relatively independent, indicating that they may have undergone independent evolution.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Phylogenetic dichotomy partitions the Fabaceae MADS-box family into type I and type II lineages.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1740598-g001.tif">
<alt-text content-type="machine-generated">Phylogenetic tree diagram showing two types, Type I in blue and Type II in pink, with labeled branches: AGL6, FLC, SEP, SOC1, AG/STK, AP3/PI, BS, AGL12, AGL17, AGL15, SVP, MIKC*. Sections Ma, M&#x3b2;, and My are marked. Tree scale is 0.3.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Deep structural dichotomy defines the MADS-box family</title>
<p>Beyond their phylogenetic placement, a profound structural dichotomy between Type I and Type II genes became immediately apparent, providing a physical basis for their divergent evolutionary fates.</p>
<p>We observed significant variation in gene architecture across both lineages and subfamilies (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>). A comprehensive structural survey of the MADS-box gene family among 52 legume species uncovered evolution patterns among different MADS-box subfamilies in three subfamilies (Papilionoideae, Caesalpinioideae and Cercidoideae) (<xref ref-type="fig" rid="f2"><bold>Figures&#xa0;2A&#x2013;E</bold></xref>). Gene length exhibits significant variation across different lineages, with Caesalpinioideae possessing longer gene (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2A</bold></xref>) and intron lengths (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2C</bold></xref>). This suggests that differences in intron length among lineages may contribute to variations in gene length. In contrast, amino acid sequence length shows no significant differences among the three lineages (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2B</bold></xref>), highlighting the high conservation of coding regions within the Fabaceae. Regarding intron number (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2D</bold></xref>) and CDS number (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2E</bold></xref>), Cercidoideae consistently have slightly higher values than Papilionoideae, underscoring the divergent gene structures present in different species lineages.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Structural dichotomy distinguishes type I and type II MADS-box genes. Boxplot gene length, Amino acid (AA) length, intron length, intron number and CDS number among three species clades <bold>(A&#x2013;E)</bold> and subfamilies <bold>(F)</bold>. Statistical significance was assessed using a t.test. Asterisks indicate statistical significance (<italic>P</italic> &lt; 0.001). Non-significant comparisons are not marked.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1740598-g002.tif">
<alt-text content-type="machine-generated">Box plots illustrating various genetic metrics across three families: Papilionoideae, Caesalpinioideae, and Cercidoideae. Metrics include gene length, amino acid length, intron length, intron number, and CDS number. Additional plots in panel F compare these metrics across different gene categories like MIKC*, AP1/FUL, and others. Statistical significance is marked with asterisks.</alt-text>
</graphic></fig>
<p>Type II genes are structurally complex, with an average length of 8,325 bp and typically containing 6 to 8 introns; some subfamilies, such as AGL17 (12,673 bp), SOC1 (13,148 bp), and FLC (12,916 bp), are particularly long due to extensive introns (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2F</bold></xref>). In stark contrast, Type I genes are structurally streamlined, with averaging over 9 introns per gene. Their average gene length is only 1,251 bp, and a remarkable 68.6% of genes are intronless and 91.04% have one or fewer introns. This pattern holds across Type I subfamilies, with 75.38% of M&#x3b1; genes, 65.58% of M&#x3b2; genes, and 61.20% of M&#x3b3; genes lacking introns entirely (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2F</bold></xref>).</p>
<p>Motif analysis of the MADS domain further reinforces this dichotomy (<xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>). Key MADS domains SRF-like domain (CDD:238166) were identified in Type-I (<xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3A</bold></xref>) and MEF2-like domain (CDD:238165) were identified in Type-II (<xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3B</bold></xref>). The MADS domain, typically ranging from 71 to 83 amino acids in length, is highly conserved and merits a detailed analysis of its sequence. All Type I proteins contain a highly conserved SRF-like domain (CDD:238166) characterized by two consensus motifs: &#x201c;MGRKKIELKKISNDSARKVTFSKRKKGLFKK&#x201d; and &#x201c;ASELSTLCGVEACAIVFSPGD&#x201d;. All Type II proteins feature a MEF2-like domain (CDD:238165), also defined by two motifs, but their primary consensus sequences &#x201c;MGRGKIEJKRIENKTNRQVTFSKRRNGLLKKAYELSVLCDAEVALIIFSS&#x201d; and &#x201c;TGKLYEYASSSMMEK&#x201d; are more highly conserved than its Type I counterpart and shows distinct positional variations among subfamilies. For example, in the AG/STK subfamily, it starts at the 21st amino acid from the N-terminus, while in the FLC subfamily, it begins at the 11th amino acid. In the AGL6 subfamily, there are 10 amino acids with higher divergence between the two motifs. It suggests fine-scale structural evolution even within this conserved domain.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Conserved motif analysis reinforces the divergence of type I and type II MADS domains. Conserved MADS-domain motifs for <bold>(A)</bold> Type I subfamilies, and <bold>(B)</bold> Type II subfamilies. Sequence logos illustrate amino acid conservation; schematics below show motif positions. The statistical significance (E-value) for each motif is indicated next to its label in the figure key.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1740598-g003.tif">
<alt-text content-type="machine-generated">Sequence logos depicting amino acid frequencies across different protein types. Panel A shows Type I proteins with subtypes M&#x3b1;, M&#x3b2;, and M&#x3b3;. Panel B displays Type II proteins, including MIKC, AP1/FUL, AP3/PI, AG/STK, SEP, AGL 6, AGL12, AGL15, AGL17, SOC1, SVP, AGL32, and FLC, illustrating diverse sequence patterns.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Dynamic history of lineage-specific expansion and gene loss</title>
<p>The total MADS-box gene count varies dramatically across the Fabaceae, from 60 in <italic>Cercis canadensis</italic> to 177 in <italic>Melilotus albus</italic>, reflecting a dynamic evolutionary history of gene gain and loss (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>). Gene number expansion is often linked to polyploidy; the recent WGD in <italic>Glycine</italic> genus, which contrasts with other species. For example, the Type-I subfamily in soybean comprises 70 MADS-box genes, with the M&#x3b1;, M&#x3b2;, and M&#x3b3; subfamilies containing 38, 10, and 22 genes, respectively. The Type-II subfamily has a total of 96 genes, with the number of genes in different subfamilies ranging from 2 to 12. Furthermore, we observed specific expansions in some subfamilies in some species. Specifically, the number of genes in the Type-I M&#x3b1; and M&#x3b3; subfamilies in <italic>Glycine</italic>, <italic>Medicago</italic>, <italic>Melilotus</italic>, and <italic>Lupinus</italic> is significantly higher than in other species. Similarly, the number of genes in the SVP and AGL17 subfamilies of Type-II in Prosopis exceeds that in other species.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>The MADS-box family exhibits a dynamic history of expansion and contraction across the Fabaceae. MADS-box gene family size mapped onto a species cladogram for 52 Fabaceae species. Heatmaps show total gene count and counts per subfamily, revealing wide variation, lineage-specific expansions, and frequent gene loss. The outgroup species Polygala tenuifolia (Polygalaceae) is highlighted in a distinct color to visually root the Fabaceae clade.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1740598-g004.tif">
<alt-text content-type="machine-generated">Phylogenetic tree and heatmap illustrating polyploidization events and histone quantity across multiple plant species. The tree categorizes species into lineages such as Fabaceae, Brassicaceae, and Poaceae. Polyploidization events are marked by squares in colors representing different gene duplications. The heatmap displays Type I and Type II histone quantities, with color gradients indicating quantity levels. Key species include Vigna hirtella, Glycine max, and Arabidopsis thaliana. The legend explains the coding for polyploidization events and major lineages.</alt-text>
</graphic></fig>
<p>Conversely, gene loss has also sculpted this family. TM8 genes were lost in all Fabaceae species surveyed but present in other species, such as grape and <italic>Amborella</italic>. FLC orthologues were mainly detected in <italic>Glycine</italic>, <italic>Dalbergia</italic> (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>) and BS, as a sister group of AP3/PI, also lost in 6 species (<italic>Acacia crassicarpa</italic>, <italic>Bauhinia championii</italic>, <italic>Biancaea sappan</italic>, <italic>Delonix regia</italic>, <italic>Senna siamea</italic>, <italic>Vicia faba</italic>, and <italic>Vigna umbellata</italic>), suggesting recurrent, lineage-specific gene loss events.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>The dualistic engine of evolution: WGD-driven conservation versus SSD-driven innovation</title>
<p>To unravel the mechanisms behind this dynamic history, we traced the duplication origins of all genes (<xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5</bold></xref>, <xref ref-type="fig" rid="f6"><bold>6</bold></xref>). This revealed a striking dualistic evolutionary model. We categorized the MADS-box genes into six duplication types, including WGD, tandem, dispersed, transposed, proximal, and singleton (<xref ref-type="supplementary-material" rid="SF1"><bold>Supplementary Figure S1</bold></xref>). Among these, WGD was the predominant type in legumes, accounting for 42.2% of the cases. This was followed by dispersed duplication (16.2%) and tandem duplication (16.1%), which exhibited comparable proportions.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Legume species employ divergent duplication strategies to shape their MADS-box repertoires. Species-specific duplication strategies for MADS-box gene families. The left side displays the phylogenetic tree of the species, with branch lengths not directly proportional to the timescale. Bar plots show the counts (middle) and proportions (right) of genes derived from different duplication modes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1740598-g005.tif">
<alt-text content-type="machine-generated">Phylogenetic tree showing relationships among legume species, with colored branches representing major lineages: Papilionoideae, Cercidoideae, and others. A table alongside lists species names and numerical data on MADS-box gene numbers and ratios, highlighted in shades of red indicating varying values. Symbols for whole-genome duplication (WGD) and whole-genome triplication (WGT) events are marked in blue and red on the tree.</alt-text>
</graphic></fig>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Dualistic duplication engine drives the evolution of the MADS-box family. The absolute number <bold>(A)</bold> and relative ratio (percentage) <bold>(B)</bold> of genes derived from each duplication type across 52 Fabaceae species. Example of <italic>Glycine max</italic> distribution in absolute number <bold>(C)</bold> and relative ratio <bold>(D)</bold>. Scatter plots showing the correlation between WGD retention ratio and gene length <bold>(E)</bold> or intron number <bold>(F)</bold> across MADS-box subfamilies.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1740598-g006.tif">
<alt-text content-type="machine-generated">Figure A shows a heatmap of duplicated type number distribution in Fabaceae across different genes and duplication types, with a color gradient from green to red representing higher values. Figure B displays the percentage distribution with a similar gradient. Figure C depicts a heatmap for Glycine max, indicating lower numbers in a different color scale. Figure D shows the percentage distribution for Glycine max. Figure E presents a scatter plot of WGD ratio against gene length, indicating a positive trend (R&#xb2; = 0.3). Figure F is a scatter plot showing WGD ratio versus intron number with a stronger positive trend (R&#xb2; = 0.52).</alt-text>
</graphic></fig>
<sec id="s3_4_1">
<label>3.4.1</label>
<title>The conserved WGD-driven expansion of type II genes</title>
<p>The expansion of Type II subfamilies, particularly those governing fundamental developmental processes, is tightly coupled to WGD events (<xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5</bold></xref>, <xref ref-type="fig" rid="f6"><bold>6A, B</bold></xref>). Over 60% of the members in key subfamilies like SOC1, SEP, AP3/PI, and AG/STK originated from WGDs. The expansion of several core MADS-box families involved in the &#x201c;ABCDE model&#x201d; of floral organ development showed a tight coupling with WGD events. In the genus <italic>Glycine</italic>, which experienced a recent WGD, subfamilies such as AP1/FUL, AP3/PI, AG/STK, and SEP, as well as other subfamilies like AGL17, SOC1, and SVP, were markedly expanded compared to other legumes (<xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5</bold></xref>, <xref ref-type="fig" rid="f6"><bold>6C, D</bold></xref>). Within these conserved core subfamilies (e.g., AP1/FUL, AP3/PI, and SEP), genes originating from tandem duplication were extremely rare, suggesting that their expansion is under strict functional constraints and occurs primarily through WGD events (<xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5</bold></xref>, <xref ref-type="fig" rid="f6"><bold>6A, B</bold></xref>).</p>
</sec>
<sec id="s3_4_2">
<label>3.4.2</label>
<title>The dynamic periphery&#x2014;SSD-driven expansion of type I genes and lineage-specific type II genes</title>
<p>In stark contrast, all Type I subfamilies evolved dynamically, with their expansion overwhelmingly driven by a suite of SSD events&#x2014;dispersed, proximal, and tandem duplications (<xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6A, B</bold></xref>). This pattern was particularly prominent in the genera <italic>Melilotus</italic> and <italic>Medicago</italic> (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref>). In <italic>Melilotus</italic> albus, for example, out of its large MADS-box family of 177 members, only 9.0% originated from WGD, whereas the combined contribution of dispersed, proximal, and tandem duplications was 82.5% (24.3%, 29.4%, and 28.8%, respectively. In <italic>Medicago</italic>, the contribution from WGD also remained low at 20%-25%, with expansion primarily driven by dispersed duplications. In <italic>Medicago truncatula</italic>, for example, dispersed duplications contributed 41.9%, making it the primary driver of its gene family expansion. This SSD-driven &#x201c;birth-and-death&#x201d; cycle also fuels innovation in specific Type II subfamilies, which are completely decoupled from WGD. A dramatic example is in the genus <italic>Prosopis</italic>, where the SVP subfamily expanded rapidly to 24 members via SSD duplication, accounting for 85.71% of its total 28 members (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>; <xref ref-type="supplementary-material" rid="SF2"><bold>Supplementary Figure S2</bold></xref>).</p>
<p>To explore the relationship between gene architecture and evolutionary dynamics, we analyzed the correlation between structural characteristics and WGD retention rates across all subfamilies (<xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6E, F</bold></xref>). We observed positive correlations between the WGD ratio and both gene length (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6E</bold></xref>) and average intron number (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6F</bold></xref>). These results indicate that subfamilies with higher structural complexity are more likely to be expanded via WGD, while structurally simpler subfamilies show a lower dependence on WGD.</p>
</sec>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Contrasting selection pressures underpin the dualistic pattern</title>
<p>To understand the molecular basis for this dualistic pattern, we contrasted the selection pressures on 912 unique WGD-derived gene pairs and unique 635 SSD-derived gene pairs. Analysis of evolutionary rates revealed that WGD pairs exhibited significantly higher synonymous (<italic>K</italic>s) and non-synonymous (<italic>K</italic>a) substitution rates (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7A</bold></xref>). The median <italic>K</italic>s values of WGD pairs were substantially higher than those of SSD pairs (Wilcox test, <italic>P</italic> &lt; 0.001), indicating that the former diverged earlier.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Ka/Ks analysis genes. <bold>(A)</bold> Statistical significance was assessed using a wilcox.test. Asterisks indicate statistical significance (<italic>P</italic> &lt; 0.001). <bold>(B)</bold> Ridgeline plots illustrate the density distribution of <italic>Ka</italic>, <italic>Ks</italic>, and Ka/Ks ratios for duplicated gene pairs within each subfamily.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1740598-g007.tif">
<alt-text content-type="machine-generated">Panel A shows three violin plots comparing Ka, Ks, and Ka/Ks ratios between whole genome duplication (WGD) and small-scale duplication (SSD). Ka shows no significant difference, while Ks and Ka/Ks exhibit significant differences marked by asterisks. Panel B displays density plots of Ka, Ks, and Ka/Ks ratios for various gene families, with color gradients indicating density levels.</alt-text>
</graphic></fig>
<p>To reconstruct the fine-scale temporal history of these lineages, we further analyzed the distribution of <italic>K</italic>s across subfamilies (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7B</bold></xref>). This analysis revealed a clear temporal stratification. The conserved Type II subfamilies (e.g., SEP, AP1/FUL, AG/STK) exhibit a bimodal <italic>K</italic>s distribution. In addition to recent duplications, they display a distinct concentration of gene pairs peaks. This suggests that the expansion of the core developmental machinery was a direct legacy of this ancient polyploidy event.</p>
<p>Consistent with these distinct evolutionary trajectories, the analysis of selection pressure showed a completely opposite trend. The Ka/Ks ratios of WGD pairs were significantly lower than those of SSD pairs (Wilcox test, <italic>P</italic> &lt; 0.001) (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7A</bold></xref>), suggesting the MADS-box genes from WGDs are functionally constrained by strong purifying selection, while dynamic genes from SSDs experience more relaxed constraints, affording them greater freedom to accumulate mutations and explore new functions.</p>
</sec>
<sec id="s3_6">
<label>3.6</label>
<title>Pangenome analysis reveals a conserved core and a dispensable periphery</title>
<p>The functional consequences of these divergent evolutionary paths are evident at the pangenome level (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8</bold></xref>). We clustered all genes into 202 orthologous gene groups (OGGs), comprising 7 core clusters (1,891 genes), 5 soft-core clusters (946 genes), 53 shell clusters (1,666 genes), 137 cloud clusters (369 genes) (<xref ref-type="fig" rid="f8"><bold>Figures&#xa0;8A, B</bold></xref>). We further investigated the relationship between gene duplication types and the conservation of MADS-box genes in the legume pangenome (<xref ref-type="fig" rid="f8"><bold>Figures&#xa0;8C, D</bold></xref>). We found that WGD-derived genes were enriched in the core gene set (57.80%), with their prevalence decreasing toward the cloud category (18.70%). Conversely, SSD-derived genes exhibited an opposite trend: they were most abundant in the cloud (81.30%) and least frequent in the core (42.20%). These results suggest that WGD is a major contributor to highly conserved genes, while SSD-derived genes are more often variable or accessory. In addition, our investigation of evolutionary conservation at the subfamily level revealed that the &#x201c;ABCDE model&#x201d; genes&#x2014;<italic>AG</italic>/<italic>STK</italic>, <italic>AGL12</italic>, <italic>AGL17</italic>, <italic>AP1</italic>/<italic>FUL</italic>, <italic>SEP</italic>, and <italic>SOC1</italic>&#x2014;were predominantly classified as core or soft-core genes, The near-universal presence across the 52 species highlights their critical and indispensable functional roles. For example, the high composition proportion of core genes observed in the <italic>AGL12</italic> (100% core genes), <italic>SEP</italic> (97.664%), <italic>AGL17</italic> (95.05%), <italic>SOC1</italic> (94.75%), <italic>AP1</italic>/<italic>FUL</italic> (93.79%), and <italic>AG</italic>/<italic>STK</italic> (81.39%). Conversely, subfamilies like M&#x3b2;, AGL6, AGL15 and FLC subfamilies showed lower conservation, predominantly comprised of shell genes. These results reflect their rapid turnover and variable presence across lineages, and mirror our dualistic model.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Pangenome analysis reveals a conserved core of developmental regulators and a dispensable periphery. The distribution of pan-genome family types within orthologous gene groups (OGGs) <bold>(A)</bold> and at the individual gene level <bold>(B)</bold>. The number <bold>(C)</bold> and percentage <bold>(D)</bold> Distribution of different duplication types for core, soft-core, shell, and cloud MADS-box genes. The number <bold>(E)</bold> and percentage <bold>(F)</bold> distribution of MADS-box genes in each category across different subfamilies.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1740598-g008.tif">
<alt-text content-type="machine-generated">Panel A shows a pie chart of OGGs distribution: cloud (67.8%), shell (26.2%), soft-core (2.5%), core (3.5%). Panel B presents a pie chart of gene distribution: shell (34.2%), core (38.8%), soft-core (19.4%), cloud (7.6%). Panel C is a stacked bar chart of gene duplication types across categories, with wgd and singleton as prominent types. Panel D illustrates the percentage distribution of duplication types by category. Panel E is a bar chart depicting gene count by category. Panel F displays the percentage of genes in each category, highlighting variability across categories.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_7">
<label>3.7</label>
<title>Expression divergence of duplicated genes in soybean</title>
<p>A comprehensive global analysis of 3,638 soybean transcriptomes, sourced from diverse tissues under various conditions, has unveiled four distinct organ-specific modules with higher expression levels (<xref ref-type="fig" rid="f9"><bold>Figures&#xa0;9A, B</bold></xref>). Module 1, comprised of 31 genes predominantly from the SEP and AG/STK families, displayed expression highly specific to reproductive tissues (seed coat, flower, endosperm) and but absent in leaves and roots, likely regulating seed maturation and floral organogenesis. We also found a leaf-specific module of seven genes (Module 2), likely involved in photosynthesis and flowering time control. A distinct root-specific module of 12 genes (Module 3), enriched in <italic>AGL12</italic> and <italic>AGL17-like</italic> genes, points to specialized roles in nutrient uptake and root development. Module 4 comprises 13 genes, predominantly from the SOC1 and SVP families, that are widely expressed in both roots and leaves. Our investigation into the cross-module distribution of gene duplication states revealed that the different copies of duplicated genes were systematically partitioned into different modules except for Module 1 (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9C</bold></xref>). This pattern implies that expression differentiation in root or leaf has occurred for these duplicated genes.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>The expression atlas of soybean MADS-box genes unveils highly specialized, organ-specific regulatory modules and significant expression divergence. <bold>(A)</bold> Expression profiles of MADS-box genes across 3,638 samples in soybean. Clustering was performed using hierarchical clustering (Ward.D2 method, Euclidean distance) on row-scaled log2 (FPKM) values. Letters marked in the figure denote modules with higher expression levels. <bold>(B)</bold> Four tissue-specific expression modules identified in <bold>(A)</bold> are highlighted. <bold>(C)</bold> Distribution of duplicated gene pairs across different modules. <bold>(D)</bold> Expression divergence of tandem-duplicated gene pairs across various tissues. <bold>(E)</bold> Expression divergence of whole-genome duplication (WGD)-derived gene pairs across different tissues. <bold>(F)</bold> Expression divergence of WGD-derived gene pairs under abiotic stress conditions. <bold>(G)</bold> Expression divergence of WGD-derived gene pairs under biotic stress conditions.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1740598-g009.tif">
<alt-text content-type="machine-generated">The image contains several panels illustrating gene expression data. Panel A and B are heatmaps showing expression across different tissues, with modules highlighted. Panel C is a flow diagram depicting connections between gene modules and expression categories. Panels D, E, F, and G are bar graphs comparing expression levels of tandem genes, whole-genome duplication genes, and genes under abiotic and biotic stress types, respectively. Each graph categorizes expression levels between two expression groups, labeled Duplicate 1 and Duplicate 2.</alt-text>
</graphic></fig>
<p>Furthermore, we focused on the expression divergence between the two main types of gene duplication: tandem duplication and whole-genome duplication (WGD). We focused on tandem duplication as the primary SSD representative because both WGD and tandem duplication are mechanistically distinct and algorithmically clear-cut duplication modes (i.e., syntenic blocks vs. local arrays). In contrast, other SSD categories like dispersed represent heterogeneous, catch-all classifications, making them less suitable for a robust comparison. Tandem duplicated pairs generally showed low expression across most tissues but were specifically upregulated in the endosperm (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9D</bold></xref>; <xref ref-type="supplementary-material" rid="SM5"><bold>Supplementary Table S5</bold></xref>). In contrast, WGD-derived pairs exhibited higher and more coordinated expression across multiple tissues, particularly in flowers, seed coats, and pods, supporting their role in conserved developmental programs (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9E</bold></xref>). We also assessed the distribution of &#x201c;high-expression, large-divergence&#x201d; gene pairs&#x2014;defined as those with expression levels &gt; 10 and fold-change &gt; 5&#x2014;across different tissues. The highest number of such pairs was identified in the endosperm (17 pairs), followed by the nodule (11 pairs), and the root and seed coat (10 pairs each) (<xref ref-type="supplementary-material" rid="SM6"><bold>Supplementary Table S6</bold></xref>).</p>
<p>In addition, we investigated the evolutionary and expression divergence within soybean transcriptomes in response to stress treatments. Under abiotic stress conditions, WGD-derived gene pairs sustained elevated overall expression levels, yet exhibited marked divergence among paralogs, particularly in response to ozone, salt, and drought stress (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9F</bold></xref>). This pattern of asymmetrical expression was even more pronounced under biotic stress. Notably, WGD-derived gene pairs demonstrated exceptionally high expression in response to infections by <italic>Sclerotinia sclerotiorum</italic> and <italic>Rotylenchulus reniformis</italic> (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9G</bold></xref>). Under biotic stress conditions, the average fold change of 3.24 for WGD pairs higher than the 2.76-fold change observed under abiotic stress conditions (<xref ref-type="supplementary-material" rid="SM7"><bold>Supplementary Tables S7</bold></xref>, <xref ref-type="supplementary-material" rid="SM8"><bold>S8</bold></xref>). This indicates that not only are asymmetric expression patterns prevalent under biotic stress, but they are also more pronounced compared to abiotic stress.</p>
</sec>
<sec id="s3_8">
<label>3.8</label>
<title>Explore the MADS-box genes expression in soybean under drought and salt stress treatment</title>
<p>We focused on six MADS-box genes responding to abiotic stress treatment (<xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref>). The <italic>Glyma.08G05400</italic>, which is broadly expressed across multiple tissues within module 4, and the <italic>Glyma.19G034600</italic>, which shows leaf-specific high expression in module 2. Two pairs of WGD-derived genes displaying marked expression divergence under abiotic stress&#x2014;<italic>Glyma.05G227200</italic> vs. <italic>Glyma.08G033900</italic> and <italic>Glyma.01G020500</italic> vs. <italic>Glyma.09G201700</italic>&#x2014;were selected for transcriptome validation. Expression analysis revealed that <italic>Glyma.08G05400</italic> was strongly induced under salt stress, with a more than 110-fold increase in leaves after 12 hours relative to the control. Under drought stress, this gene was significantly activated at 3 hours and peaked at 8 hours, exhibiting over 27-fold upregulation. The <italic>Glyma.19G034600</italic> was notably induced at 3 hours under drought stress and reached a maximum at 8 hours, with expression levels exceeding 150-fold that of the control. Among the duplicated gene pairs, both <italic>Glyma.05G227200</italic> and <italic>Glyma.08G033900</italic> were upregulated under drought stress, but their induction levels differed substantially: <italic>Glyma.05G227200</italic> showed over 66-fold induction, whereas <italic>Glyma.08G033900</italic> reached a maximum of only 25-fold. A similar divergence was observed under salt stress, where <italic>Glyma.05G227200</italic> was induced more than 9.13-fold compared to only 3.49-fold for <italic>Glyma.08G033900</italic>. We further analyzed the duplicated pair <italic>Glyma.01G020500</italic> and <italic>Glyma.09G201700.</italic> Under salt stress, both genes were comparably induced, with expression increases exceeding two-fold. Under drought stress, however, <italic>Glyma.01G020500</italic> was upregulated over 15-fold, while <italic>Glyma.09G201700</italic> was downregulated. Collectively, these results clearly demonstrate expression divergence between duplicated gene copies under stress conditions and provide experimental evidence for functional differentiation following whole-genome duplication.</p>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>Expression of Six MADS-box genes under untreated (CK), drought, and salt conditions by qRT-PCR. <bold>(A)</bold> Expression of six MADS-box genes under drought stress at different time points. <bold>(B)</bold> Expression of six MADS-box genes under salt stress at different time points. Two different concentrations of salt (150 mM and 200 mM) were used. Data represent the mean of three independent biological replicates (&#xb1; SE). Different letters above the bar charts indicate significant differences at <italic>P</italic> &lt; 0.05.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1740598-g010.tif">
<alt-text content-type="machine-generated">Graphs showing relative expression levels of various Glyma genes under drought (A) and salt treatments (B). Each panel compares control (CK) with different treatment durations. Bars in different colors represent 1, 3, 8, and 12-hour intervals. Statistical significance is indicated by letters above the bars.</alt-text>
</graphic></fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<sec id="s4_1">
<label>4.1</label>
<title>A Dualistic evolutionary model resolved the post-WGD paradox in legumes</title>
<p>Our comprehensive analysis of the MADS-box gene family across 52 Fabaceae species reveals a profound dualistic evolutionary pattern that provides a compelling solution to the post-polyploidy paradox of stability versus innovation. To anchor this model in a temporal context, our <italic>K</italic>s distribution analysislocalized the primary burst of WGD-derived gene retention to approximately 59 Mya. Notably, this timing places the shared legume WGD event in the immediate aftermath of the K-Pg mass extinction (<xref ref-type="bibr" rid="B35">Koenen et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B66">Vanneste et&#xa0;al., 2014</xref>). This temporal coincidence supports the hypothesis that polyploidy served as a critical survival strategy, providing the ancestral legume lineage with a surplus of genetic raw material to rapidly colonize ecological niches left vacant by the extinction event.</p>
<p>Crucially, however, the explosive radiation of legumes following this K-Pg boundary WGD was not driven by a monolithic expansion of its master developmental regulators. Instead, we propose a two-speed evolutionary architecture: a conserved core of Type II (MIKC) genes, safeguarded by strong purifying selection after being duplicated by WGD, provided developmental stability. Simultaneously, a dynamic periphery, primarily composed of Type I genes, rapidly evolved through SSDs under relaxed selection, offering a continuous source of genetic novelty. This division of evolutionary roles allowed the ancestral legume genome to reconstruct order from the genomic plasticity of WGD, ensuring the robustness of essential programs while fostering the adaptive potential that fueled its subsequent success.</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Gene dosage balance as a guardian of developmental integrity</title>
<p>Our finding that core MIKC-type subfamilies expanded primarily via WGD provides strong support for the gene dosage balance hypothesis (<xref ref-type="bibr" rid="B8">Birchler and Veitia, 2014</xref>) (<xref ref-type="bibr" rid="B7">Birchler and Veitia, 2010</xref>; <xref ref-type="bibr" rid="B15">Conant et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B59">Shi et&#xa0;al., 2020</xref>). MADS-box proteins rarely act alone; they function by assembling into stoichiometrically precise multiprotein complexes, such as the heterotetramers of the floral quartet model, to regulate downstream gene networks (<xref ref-type="bibr" rid="B58">Sheng et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B71">Ye et&#xa0;al., 2021</xref>).</p>
<p>According to the dosage balance hypothesis, the random, small-scale duplication of a single component would disrupt this delicate stoichiometry, leading to non-functional complexes and deleterious phenotypes, and would thus be purged by strong purifying selection (<xref ref-type="bibr" rid="B44">Manzoor et&#xa0;al., 2024</xref>; <xref ref-type="bibr" rid="B54">Qiao et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B69">Wilson and Liberles, 2023</xref>). In contrast, a WGD event duplicates the entire network proportionally, preserving the balance and providing a viable pathway for the coordinated expansion of these interconnected regulatory modules (<xref ref-type="bibr" rid="B12">Clark and Donoghue, 2018</xref>; <xref ref-type="bibr" rid="B62">Soltis et&#xa0;al., 2015</xref>).</p>
<p>Our results, which show both the preferential retention of these genes post-WGD and the intense purifying selection acting upon them (low Ka/Ks ratio), empirically validate this theory. This demonstrates how a fundamental biochemical constraint&#x2014;the need for stoichiometric balance&#x2014;acts as a powerful evolutionary filter, preserving the integrity of core developmental machinery through deep time.</p>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>The dynamic periphery: a crucible for adaptive innovation</title>
<p>In stark contrast to the conserved core, the dynamic periphery driven by SSDs acts as a crucible for adaptive evolution (<xref ref-type="bibr" rid="B17">Defoort et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B21">Ezoe et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B24">Glover et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B43">Magadum et&#xa0;al., 2013</xref>). Our results show that Type I subfamilies, along with specific Type II lineages have undergone rapid, lineage-specific expansions via tandem and other SSDs. This mode of evolution, coupled with the relaxed purifying selection we observed, creates a &#x201c;birth-and-death&#x201d; scenario where new gene copies are constantly generated, providing raw material for neofunctionalization or subfunctionalization (<xref ref-type="bibr" rid="B19">Dort et&#xa0;al., 2024</xref>; <xref ref-type="bibr" rid="B77">Zhao et&#xa0;al., 2015</xref>). Crucially, our analysis suggests that this relaxed selection facilitates distinct functional trajectories depending on the lineage. For the enigmatic Type I subfamily, rapid evolution appears channeled primarily into reproductive specialization. Consistent with their preferential expression in seeds and gametophytes, the high sequence divergence of Type I genes may be driven by the parental conflict hypothesis or the need to establish rapid reproductive barriers, rather than abiotic stress tolerance in general (<xref ref-type="bibr" rid="B47">Mora-Garcia and Goodrich, 2000</xref>). In contrast, the functional shift towards environmental resilience is most prominent in SSD-expanded Type II lineages.</p>
<p>A compelling case for this environmental adaptation is the massive tandem expansion of the SVP subfamily in the arid-adapted genus <italic>Prosopis</italic>. As SVP homologs are known integrators of environmental signals that control flowering time, we hypothesize that this expanded repertoire of <italic>SVP</italic> genes may have allowed <italic>Prosopis</italic> to evolve a more sophisticated and resilient regulatory network to fine-tune its reproductive strategy in a harsh, unpredictable desert environment (<xref ref-type="bibr" rid="B55">Quesada-Traver et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B61">Shu et&#xa0;al., 2013</xref>). This dynamic nature is further reflected in the physical gene architecture itself. The structural analysis revealed that the Papilionoideae lineage possesses significantly more streamlined genes (i.e., fewer and shorter introns) compared to the more ancestral, intron-rich structures seen in Caesalpinioideae. This derived trait of genomic compaction, particularly prevalent in the Type I periphery (<xref ref-type="bibr" rid="B6">Bemer et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B16">De Bodt et&#xa0;al., 2003</xref>), would lower the energetic and temporal costs of transcription. Such streamlining acts as a powerful evolutionary facilitator for the rapid &#x201c;birth-and-death&#x201d; cycles and adaptive exploration that characterize these SSD-driven &#x201c;accessory&#x201d; genes. This provides a powerful example of the evolutionary chain linking genome structural variation, gene family expansion, and species-specific ecological adaptation.</p>
</sec>
<sec id="s4_4">
<label>4.4</label>
<title>WGD as an evolutionary starting point, not an endpoint</title>
<p>Our findings reshape the understanding of WGD&#x2019;s role, casting it not as a deterministic endpoint but as a stochastic &#x201c;starting point&#x201d; that triggers divergent, contingent evolutionary trajectories. The stark contrast between <italic>Bauhinia</italic>, which largely retained its WGD duplicates, and its close relative <italic>Cercis</italic>, which lost them and relied on dispersed duplications for expansion, vividly illustrates this post-polyploidy divergence. This discrepancy likely reflects fundamental differences in genomic stability and evolutionary strategy. <italic>Cercis</italic> is often characterized as possessing a highly stable genome, closely resembling the ancestral legume karyotype (<xref ref-type="bibr" rid="B31">Hyun-oh et&#xa0;al., 2024</xref>). This suggests that <italic>Cercis</italic> may operate under a conservative evolutionary regime where gene dosage balance is strictly enforced, leading to the rapid fractionation of WGD duplicates to restore a diploid-like state.</p>
<p>Conversely, <italic>Bauhinia</italic> (and the Papilionoideae lineages) appears to have leveraged genomic plasticity, retaining a larger repertoire of WGD-derived regulators. This retention may have provided the necessary genetic modularity to evolve complex traits suited for diverse tropical environments. Thus, the fate of WGD genes is not uniform but is sculpted by lineage-specific constraints&#x2014;balancing the immediate cost of genomic instability against the long-term benefit of adaptive potential.</p>
<p>Crucially, this phenomenon of contingent evolution is visible even at finer scales. Within the genus <italic>Prosopis</italic>, two closely related species employed entirely different SSDs strategies (tandem vs. transposed/dispersed) to shape their MADS-box repertoires. This demonstrates that the final architecture of a gene family is not predetermined by WGD alone. Rather, it is the product of a complex interplay between lineage-specific selective pressures and the particular modes of SSDs that predominate, confirming that the period of massive gene loss and rearrangement following a WGD is a critical window for evolutionary innovation (<xref ref-type="bibr" rid="B56">Ren et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B69">Wilson and Liberles, 2023</xref>).</p>
</sec>
<sec id="s4_5">
<label>4.5</label>
<title>Functional divergence and expression bias in soybean after whole-genome duplication</title>
<p>The functional data from our <italic>Glycine max</italic> case study provide a compelling, present-day validation of this evolutionary narrative. The expression patterns of duplicated genes directly reflect their divergent evolutionary origins. WGD-derived pairs within core subfamilies exhibit high, stable, and coordinated expression in key developmental organs, confirming their role as the conserved machinery (<xref ref-type="bibr" rid="B11">Carretero-Paulet and Fares, 2012</xref>; <xref ref-type="bibr" rid="B76">Zhao et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B79">Zhu et&#xa0;al., 2013</xref>). In contrast, the rampant asymmetric expression observed in many duplicated pairs, especially under abiotic and biotic stress, is a clear signature of functional divergence (<xref ref-type="bibr" rid="B26">Gu et&#xa0;al., 2004</xref>; <xref ref-type="bibr" rid="B28">Ha et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B68">Wei et&#xa0;al., 2025</xref>). The divergent or opposing stress responses of duplicated pairs (e.g., <italic>Glyma.05G227200</italic>/<italic>Glyma.08G033900</italic> and <italic>Glyma.01G020500</italic>/<italic>Glyma.09G201700</italic>) suggest their post-duplication subfunctionalization or neofunctionalization (<xref ref-type="bibr" rid="B53">Qian and Zhang, 2014</xref>; <xref ref-type="bibr" rid="B76">Zhao et&#xa0;al., 2020</xref>). This extensive expression divergence generates a reservoir of genes with novel expression patterns, providing the functional basis for the adaptive plasticity that has allowed legumes to thrive in diverse environments (<xref ref-type="bibr" rid="B18">De Smet et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B20">Ebadi et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B28">Ha et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B37">Kou et&#xa0;al., 2022</xref>).</p>
</sec>
<sec id="s4_6">
<label>4.6</label>
<title>Model boundaries, limitations, and future perspectives</title>
<p>It is important to note that the &#x201c;Dualistic Model&#x201d; proposed here represents a dominant evolutionary trend rather than a rigid dichotomy. We observed instances where specific lineages defy general rules under unique selective pressures. A prime example is the SVP subfamily (Type II) in the arid-adapted genus <italic>Prosopis</italic>. Although Type II genes are typically constrained to the conserved core driven by WGD, the SVP lineage in Prosopis has &#x201c;crossed the boundary&#x201d; into the dynamic periphery, undergoing SSD. This suggests that the structural constraints preventing Type II SSD expansion are not absolute. When the adaptive value of diversifying a specific regulator outweighs the cost of genomic instability, evolution can override these constraints.</p>
<p>While our study provides a comprehensive evolutionary framework, these exceptions highlight that our current insights represent a starting point rather than a conclusion. Our conclusions on the adaptive significance of specific gene expansions are primarily based on genomic correlation and expression data, while our deep transcriptomic insights are confined to Glycine max. Furthermore, our focus on a single gene family necessarily simplifies what was undoubtedly a genome-wide phenomenon. Therefore, the most critical next step is to move from evolutionary inference to direct functional validation. CRISPR/Cas9-based functional genomics will be essential for testing the key adaptive hypotheses proposed here, such as dissecting the role of the massively expanded SVP subfamily in the drought tolerance of Prosopis and characterizing the highly stress-responsive, asymmetrically expressed gene pairs from soybean to confirm their roles in climate resilience.</p>
<p>Beyond direct validation, our findings open avenues to address fundamental questions in legume biology and evolution. A major challenge is to unravel the enigma of the rapidly evolving Type I MADS-box genes. An even broader frontier lies in understanding how the MADS-box regulatory network co-evolved with other key legume innovations, such as symbiotic nitrogen fixation, by exploring how these master regulators of root development were potentially co-opted to enable the formation of a novel organ&#x2014;the nodule.</p>
</sec>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>In this study, we conducted a pangenomic analysis of MADS-box genes across 52 legume species, identifying 4,872 genes and reconstructing their phylogeny into 16 subfamilies. Our analysis revealed a pervasive dualistic evolutionary model driven by distinct duplication mechanisms. WGD-derived genes were primarily enriched in the conserved core genome, which includes essential floral regulators such as the &#x201c;ABCDE model&#x201d; genes. These WGD-derived genes are under strong purifying selection, thereby ensuring developmental stability. In contrast, SSD-derived genes dominate the variable regions of the genome. Evolving under relaxed selection, they facilitate lineage-specific innovation, as exemplified by the massive tandem expansion of the SVP clade in <italic>Prosopis</italic>. This dichotomy is also reflected in gene structure: structurally complex Type II genes tend to expand via WGD, while streamlined Type I genes proliferate through SSD. This structural&#x2013;functional dichotomy was further validated in soybean, where WGD pairs show coordinated developmental expression, and exhibit stress-induced expression divergence. Our findings establish a unified evolutionary framework highlighting how duplication mechanisms and selection pressures jointly shape the legume MADS-box family.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material</bold></xref>. Further inquiries can be directed to the corresponding author.</p></sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>KK: Writing &#x2013; original draft, Writing &#x2013; review &amp; editing, Conceptualization, Funding acquisition, Resources, Supervision, Validation. HN: Data curation, Formal Analysis, Investigation, Methodology, Validation, Writing &#x2013; original draft. XC: Data curation, Methodology, Software, Writing &#x2013; review &amp; editing. JZ: Data curation, Formal Analysis, Software, Writing &#x2013; original draft. MZ: Data curation,&#xa0;Resources, Software, Writing &#x2013; review &amp; editing. ES: Data curation, Formal Analysis, Investigation, Software, Validation, Writing &#x2013; review &amp; editing. XG: Formal Analysis, Investigation, Methodology, Resources, Software, Writing &#x2013; review &amp; editing.</p></sec>
<ack>
<title>Acknowledgments</title>
<p>We thank the Heilongjiang Provincial Key Laboratory of Plant Genetic Engineering and Biological Fermentation Engineering for Cold Region of Heilongjiang University. We appreciate the help of the research assistant.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2025.1740598/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2025.1740598/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table1.xlsx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;1</label>
<caption>
<p>Taxon list of species used for our analyses</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table1.xlsx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;2</label>
<caption>
<p>Soybean RNA-seq sample listed used</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table1.xlsx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;3</label>
<caption>
<p>List of primer sequences used in this study</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table1.xlsx" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;4</label>
<caption>
<p>MADS-box gene information identified in this study</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table1.xlsx" id="SM5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;5</label>
<caption>
<p>Tandem duplicated gene mean expression in different tissues</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table1.xlsx" id="SM6" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;6</label>
<caption>
<p>WGD-derived duplicated gene mean expression in different tissues</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table1.xlsx" id="SM7" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;7</label>
<caption>
<p>WGD-derived duplicated gene mean expression in abiotics stress</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table1.xlsx" id="SM8" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;8</label>
<caption>
<p>WGD-derived duplicated gene mean expression in biotics stress</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Image1.jpg" id="SF1" mimetype="image/jpeg"><label>Supplementary Figure&#xa0;1</label>
<caption>
<p>Duplication type distributions for 4,872 MADS-box genes.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Image2.jpg" id="SF2" mimetype="image/jpeg"><label>Supplementary Figure&#xa0;2</label>
<caption>
<p>The duplication distribution for SVP subfamily in reach species. <bold>(A)</bold> is the number distributions and <bold>(B)</bold> is the percentage.</p>
</caption></supplementary-material></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Airoldi</surname> <given-names>C. A.</given-names></name>
<name><surname>Davies</surname> <given-names>B.</given-names></name>
</person-group> (<year>2012</year>). 
<article-title>Gene duplication and the evolution of plant MADS-box transcription factors</article-title>. <source>J. Genet. Genomics</source> <volume>39</volume>, <fpage>157</fpage>&#x2013;<lpage>165</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jgg.2012.02.008</pub-id>, PMID: <pub-id pub-id-type="pmid">22546537</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ali</surname> <given-names>Z.</given-names></name>
<name><surname>Raza</surname> <given-names>Q.</given-names></name>
<name><surname>Atif</surname> <given-names>R. M.</given-names></name>
<name><surname>Aslam</surname> <given-names>U.</given-names></name>
<name><surname>Ajmal</surname> <given-names>M.</given-names></name>
<name><surname>Chung</surname> <given-names>G.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Genetic and molecular control of floral organ identity in cereals</article-title>. <source>Int. J. Mol. Sci.</source> <volume>20</volume>, <fpage>2743</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms20112743</pub-id>, PMID: <pub-id pub-id-type="pmid">31167420</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ambrose</surname> <given-names>B. A.</given-names></name>
<name><surname>Smalls</surname> <given-names>T. L.</given-names></name>
<name><surname>Zumajo-Cardona</surname> <given-names>C.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>All type II classic MADS-box genes in the lycophyte Selaginella moellendorffii are broadly yet discretely expressed in vegetative and reproductive tissues</article-title>. <source>Evol. Dev.</source> <volume>23</volume>, <fpage>215</fpage>&#x2013;<lpage>230</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/ede.12375</pub-id>, PMID: <pub-id pub-id-type="pmid">33666357</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bailey</surname> <given-names>T. L.</given-names></name>
<name><surname>Johnson</surname> <given-names>J.</given-names></name>
<name><surname>Grant</surname> <given-names>C. E.</given-names></name>
<name><surname>Noble</surname> <given-names>W. S.</given-names></name>
</person-group> (<year>2015</year>). 
<article-title>The MEME suite</article-title>. <source>Nucleic Acids Res.</source> <volume>43</volume>, <fpage>W39</fpage>&#x2013;<lpage>W49</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkv416</pub-id>, PMID: <pub-id pub-id-type="pmid">25953851</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bartlett</surname> <given-names>M. E.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>Changing MADS-box transcription factor protein-protein interactions as a mechanism for generating floral morphological diversity</article-title>. <source>Integr. Comp. Biol.</source> <volume>57</volume>, <fpage>1312</fpage>&#x2013;<lpage>1321</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/icb/icx067</pub-id>, PMID: <pub-id pub-id-type="pmid">28992040</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bemer</surname> <given-names>M.</given-names></name>
<name><surname>Heijmans</surname> <given-names>K.</given-names></name>
<name><surname>Airoldi</surname> <given-names>C.</given-names></name>
<name><surname>Davies</surname> <given-names>B.</given-names></name>
<name><surname>Angenent</surname> <given-names>G. C.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>An atlas of type I MADS box gene expression during female gametophyte and seed development in Arabidopsis</article-title>. <source>Plant Physiol.</source> <volume>154</volume>, <fpage>287</fpage>&#x2013;<lpage>300</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1104/pp.110.160770</pub-id>, PMID: <pub-id pub-id-type="pmid">20631316</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Birchler</surname> <given-names>J. A.</given-names></name>
<name><surname>Veitia</surname> <given-names>R. A.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>The gene balance hypothesis: implications for gene regulation, quantitative traits and evolution</article-title>. <source>New Phytol.</source> <volume>186</volume>, <fpage>54</fpage>&#x2013;<lpage>62</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1469-8137.2009.03087.x</pub-id>, PMID: <pub-id pub-id-type="pmid">19925558</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Birchler</surname> <given-names>J. A.</given-names></name>
<name><surname>Veitia</surname> <given-names>R. A.</given-names></name>
</person-group> (<year>2014</year>). 
<article-title>The Gene Balance Hypothesis: dosage effects in plants</article-title>. <source>Methods Mol. Biol.</source>, <volume>1112</volume><fpage>25</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-1-62703-773-0_2</pub-id>, PMID: <pub-id pub-id-type="pmid">24478005</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Buchfink</surname> <given-names>B.</given-names></name>
<name><surname>Reuter</surname> <given-names>K.</given-names></name>
<name><surname>Drost</surname> <given-names>H. G.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Sensitive protein alignments at tree-of-life scale using DIAMOND</article-title>. <source>Nat. Methods</source> <volume>18</volume>, <fpage>366</fpage>&#x2013;<lpage>368</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41592-021-01101-x</pub-id>, PMID: <pub-id pub-id-type="pmid">33828273</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Capella-Guti&#xe9;rrez</surname> <given-names>S.</given-names></name>
<name><surname>Silla-Mart&#xed;nez</surname> <given-names>J. M.</given-names></name>
<name><surname>Gabald&#xf3;n</surname> <given-names>T.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>trimAl: a tool for automated alignment trimming in large-scale phylogenetic analyses</article-title>. <source>Bioinformatics</source> <volume>25</volume>, <fpage>1972</fpage>&#x2013;<lpage>1973</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btp348</pub-id>, PMID: <pub-id pub-id-type="pmid">19505945</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Carretero-Paulet</surname> <given-names>L.</given-names></name>
<name><surname>Fares</surname> <given-names>M. A.</given-names></name>
</person-group> (<year>2012</year>). 
<article-title>Evolutionary dynamics and functional specialization of plant paralogs formed by whole and small-scale genome duplications</article-title>. <source>Mol. Biol. Evol.</source> <volume>29</volume>, <fpage>3541</fpage>&#x2013;<lpage>3551</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/mss162</pub-id>, PMID: <pub-id pub-id-type="pmid">22734049</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Clark</surname> <given-names>J. W.</given-names></name>
<name><surname>Donoghue</surname> <given-names>P. C. J.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>Whole-genome duplication and plant macroevolution</article-title>. <source>Trends Plant Sci.</source> <volume>23</volume>, <fpage>933</fpage>&#x2013;<lpage>945</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tplants.2018.07.006</pub-id>, PMID: <pub-id pub-id-type="pmid">30122372</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Colombo</surname> <given-names>M.</given-names></name>
<name><surname>Masiero</surname> <given-names>S.</given-names></name>
<name><surname>Vanzulli</surname> <given-names>S.</given-names></name>
<name><surname>Lardelli</surname> <given-names>P.</given-names></name>
<name><surname>Kater</surname> <given-names>M. M.</given-names></name>
<name><surname>Colombo</surname> <given-names>L.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>AGL23, a type I MADS-box gene that controls female gametophyte and embryo development in Arabidopsis</article-title>. <source>Plant J.</source> <volume>54</volume>, <fpage>1037</fpage>&#x2013;<lpage>1048</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1365-313X.2008.03485.x</pub-id>, PMID: <pub-id pub-id-type="pmid">18346189</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Comai</surname> <given-names>L.</given-names></name>
</person-group> (<year>2005</year>). 
<article-title>The advantages and disadvantages of being polyploid</article-title>. <source>Nat. Rev. Genet.</source> <volume>6</volume>, <fpage>836</fpage>&#x2013;<lpage>846</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nrg1711</pub-id>, PMID: <pub-id pub-id-type="pmid">16304599</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Conant</surname> <given-names>G. C.</given-names></name>
<name><surname>Birchler</surname> <given-names>J. A.</given-names></name>
<name><surname>Pires</surname> <given-names>J. C.</given-names></name>
</person-group> (<year>2014</year>). 
<article-title>Dosage, duplication, and diploidization: clarifying the interplay of multiple models for duplicate gene evolution over time</article-title>. <source>Curr. Opin. Plant Biol.</source> <volume>19</volume>, <fpage>91</fpage>&#x2013;<lpage>98</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pbi.2014.05.008</pub-id>, PMID: <pub-id pub-id-type="pmid">24907529</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>De Bodt</surname> <given-names>S.</given-names></name>
<name><surname>Raes</surname> <given-names>J.</given-names></name>
<name><surname>Florquin</surname> <given-names>K.</given-names></name>
<name><surname>Rombauts</surname> <given-names>S.</given-names></name>
<name><surname>Rouze</surname> <given-names>P.</given-names></name>
<name><surname>Theissen</surname> <given-names>G.</given-names></name>
<etal/>
</person-group>. (<year>2003</year>). 
<article-title>Genomewide structural annotation and evolutionary analysis of the type I MADS-box genes in plants</article-title>. <source>J. Mol. Evol.</source> <volume>56</volume>, <fpage>573</fpage>&#x2013;<lpage>586</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00239-002-2426-x</pub-id>, PMID: <pub-id pub-id-type="pmid">12698294</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Defoort</surname> <given-names>J.</given-names></name>
<name><surname>Van de Peer</surname> <given-names>Y.</given-names></name>
<name><surname>Carretero-Paulet</surname> <given-names>L.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>The evolution of gene duplicates in angiosperms and the impact of protein-protein interactions and the mechanism of duplication</article-title>. <source>Genome Biol. Evol.</source> <volume>11</volume>, <fpage>2292</fpage>&#x2013;<lpage>2305</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evz156</pub-id>, PMID: <pub-id pub-id-type="pmid">31364708</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>De Smet</surname> <given-names>R.</given-names></name>
<name><surname>Sabaghian</surname> <given-names>E.</given-names></name>
<name><surname>Li</surname> <given-names>Z.</given-names></name>
<name><surname>Saeys</surname> <given-names>Y.</given-names></name>
<name><surname>Van de Peer</surname> <given-names>Y.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>Coordinated Functional Divergence of Genes after Genome Duplication in Arabidopsis thaliana</article-title>. <source>Plant Cell</source> <volume>29</volume>, <fpage>2786</fpage>&#x2013;<lpage>2800</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1105/tpc.17.00531</pub-id>, PMID: <pub-id pub-id-type="pmid">29070508</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Dort</surname> <given-names>H.</given-names></name>
<name><surname>van der Bijl</surname> <given-names>W.</given-names></name>
<name><surname>Wahlberg</surname> <given-names>N.</given-names></name>
<name><surname>Nylin</surname> <given-names>S.</given-names></name>
<name><surname>Wheat</surname> <given-names>C. W.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Genome-wide gene birth-death dynamics are associated with diet breadth variation in lepidoptera</article-title>. <source>Genome Biol. Evol.</source> <volume>16</volume>, <elocation-id>evae095</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evae095</pub-id>, PMID: <pub-id pub-id-type="pmid">38976568</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ebadi</surname> <given-names>M.</given-names></name>
<name><surname>Bafort</surname> <given-names>Q.</given-names></name>
<name><surname>Mizrachi</surname> <given-names>E.</given-names></name>
<name><surname>Audenaert</surname> <given-names>P.</given-names></name>
<name><surname>Simoens</surname> <given-names>P.</given-names></name>
<name><surname>Van Montagu</surname> <given-names>M.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>The duplication of genomes and genetic networks and its potential for evolutionary adaptation and survival during environmental turmoil</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>120</volume>, <fpage>e2307289120</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.2307289120</pub-id>, PMID: <pub-id pub-id-type="pmid">37788315</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ezoe</surname> <given-names>A.</given-names></name>
<name><surname>Shirai</surname> <given-names>K.</given-names></name>
<name><surname>Hanada</surname> <given-names>K.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Degree of functional divergence in duplicates is associated with distinct roles in plant evolution</article-title>. <source>Mol. Biol. Evol.</source> <volume>38</volume>, <fpage>1447</fpage>&#x2013;<lpage>1459</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msaa302</pub-id>, PMID: <pub-id pub-id-type="pmid">33290522</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Freeling</surname> <given-names>M</given-names></name>
</person-group>. (<year>2009</year>). 
<article-title>Bias in plant gene content following different sorts of duplication: tandem, whole-genome, segmental, or by transposition</article-title>. <source>Annu. Rev. Plant Biol</source>. <volume>60</volume>, <fpage>433</fpage>&#x2013;<lpage>53</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev.arplant.043008.092122</pub-id>, PMID: <pub-id pub-id-type="pmid">19575588</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fu</surname> <given-names>L.</given-names></name>
<name><surname>Niu</surname> <given-names>B.</given-names></name>
<name><surname>Zhu</surname> <given-names>Z.</given-names></name>
<name><surname>Wu</surname> <given-names>S.</given-names></name>
<name><surname>Li</surname> <given-names>W.</given-names></name>
</person-group> (<year>2012</year>). 
<article-title>CD-HIT: accelerated for clustering the next-generation sequencing data</article-title>. <source>Bioinformatics</source> <volume>28</volume>, <fpage>3150</fpage>&#x2013;<lpage>3152</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bts565</pub-id>, PMID: <pub-id pub-id-type="pmid">23060610</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Glover</surname> <given-names>N. M.</given-names></name>
<name><surname>Daron</surname> <given-names>J.</given-names></name>
<name><surname>Pingault</surname> <given-names>L.</given-names></name>
<name><surname>Vandepoele</surname> <given-names>K.</given-names></name>
<name><surname>Paux</surname> <given-names>E.</given-names></name>
<name><surname>Feuillet</surname> <given-names>C.</given-names></name>
<etal/>
</person-group>. (<year>2015</year>). 
<article-title>Small-scale gene duplications played a major role in the recent evolution of wheat chromosome 3B</article-title>. <source>Genome Biol.</source> <volume>16</volume>, <fpage>188</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-015-0754-6</pub-id>, PMID: <pub-id pub-id-type="pmid">26353816</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Goyal</surname> <given-names>P.</given-names></name>
<name><surname>Devi</surname> <given-names>R.</given-names></name>
<name><surname>Verma</surname> <given-names>B.</given-names></name>
<name><surname>Hussain</surname> <given-names>S.</given-names></name>
<name><surname>Arora</surname> <given-names>P.</given-names></name>
<name><surname>Tabassum</surname> <given-names>R.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>WRKY transcription factors: evolution, regulation, and functional diversity in plants</article-title>. <source>Protoplasma</source> <volume>260</volume>, <fpage>331</fpage>&#x2013;<lpage>348</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00709-022-01794-7</pub-id>, PMID: <pub-id pub-id-type="pmid">35829836</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gu</surname> <given-names>Z.</given-names></name>
<name><surname>Rifkin</surname> <given-names>S. A.</given-names></name>
<name><surname>White</surname> <given-names>K. P.</given-names></name>
<name><surname>Li</surname> <given-names>W. H.</given-names></name>
</person-group> (<year>2004</year>). 
<article-title>Duplicate genes increase gene expression diversity within and between species</article-title>. <source>Nat. Genet.</source> <volume>36</volume>, <fpage>577</fpage>&#x2013;<lpage>579</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ng1355</pub-id>, PMID: <pub-id pub-id-type="pmid">15122255</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Guo</surname> <given-names>H.</given-names></name>
<name><surname>Lee</surname> <given-names>T. H.</given-names></name>
<name><surname>Wang</surname> <given-names>X.</given-names></name>
<name><surname>Paterson</surname> <given-names>A. H.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Function relaxation followed by diversifying selection after whole-genome duplication in flowering plants</article-title>. <source>Plant Physiol.</source> <volume>162</volume>, <fpage>769</fpage>&#x2013;<lpage>778</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1104/pp.112.213447</pub-id>, PMID: <pub-id pub-id-type="pmid">23580595</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ha</surname> <given-names>M.</given-names></name>
<name><surname>Li</surname> <given-names>W. H.</given-names></name>
<name><surname>Chen</surname> <given-names>Z. J.</given-names></name>
</person-group> (<year>2007</year>). 
<article-title>External factors accelerate expression divergence between duplicate genes</article-title>. <source>Trends Genet.</source> <volume>23</volume>, <fpage>162</fpage>&#x2013;<lpage>166</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tig.2007.02.005</pub-id>, PMID: <pub-id pub-id-type="pmid">17320239</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hong</surname> <given-names>S.</given-names></name>
<name><surname>Lim</surname> <given-names>Y. P.</given-names></name>
<name><surname>Kwon</surname> <given-names>S. Y.</given-names></name>
<name><surname>Shin</surname> <given-names>A. Y.</given-names></name>
<name><surname>Kim</surname> <given-names>Y. M.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Genome-wide comparative analysis of flowering-time genes; insights on the gene family expansion and evolutionary perspective</article-title>. <source>Front. Plant Sci.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2021.702243</pub-id>, PMID: <pub-id pub-id-type="pmid">34290729</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hu</surname> <given-names>J.</given-names></name>
<name><surname>Chen</surname> <given-names>Q.</given-names></name>
<name><surname>Idrees</surname> <given-names>A.</given-names></name>
<name><surname>Bi</surname> <given-names>W.</given-names></name>
<name><surname>Lai</surname> <given-names>Z.</given-names></name>
<name><surname>Sun</surname> <given-names>Y.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Structural and functional analysis of the MADS-box genes reveals their functions in cold stress responses and flower development in tea plant (Camellia sinensis)</article-title>. <source>Plants (Basel)</source> <volume>12</volume>, <fpage>2929</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/plants12162929</pub-id>, PMID: <pub-id pub-id-type="pmid">37631141</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hyun-oh</surname> <given-names>L.</given-names></name>
<name><surname>Jacob</surname> <given-names>S. S.</given-names></name>
<name><surname>Qiao</surname> <given-names>X.</given-names></name>
<name><surname>Thulani</surname> <given-names>H.</given-names></name>
<name><surname>Rabnoor</surname> <given-names>B.</given-names></name>
<name><surname>Alex</surname> <given-names>L.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Legume genome structures and histories inferred from Cercis canadensis and Chamaecrista fasciculata genomes</article-title>. <source>BioRxiv</source>. <volume>09.03</volume>. <elocation-id>611065</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2024.09.03.611065</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Jiao</surname> <given-names>Y.</given-names></name>
<name><surname>Leebens-Mack</surname> <given-names>J.</given-names></name>
<name><surname>Ayyampalayam</surname> <given-names>S.</given-names></name>
<name><surname>Bowers</surname> <given-names>J. E.</given-names></name>
<name><surname>McKain</surname> <given-names>M. R.</given-names></name>
<name><surname>McNeal</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2012</year>). 
<article-title>A genome triplication associated with early diversification of the core eudicots</article-title>. <source>Genome Biol.</source> <volume>13</volume>, <fpage>R3</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/gb-2012-13-1-r3</pub-id>, PMID: <pub-id pub-id-type="pmid">22280555</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Katoh</surname> <given-names>K.</given-names></name>
<name><surname>Standley</surname> <given-names>D. M.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>MAFFT multiple sequence alignment software version 7: improvements in performance and usability</article-title>. <source>Mol. Biol. Evol.</source> <volume>30</volume>, <fpage>772</fpage>&#x2013;<lpage>780</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/mst010</pub-id>, PMID: <pub-id pub-id-type="pmid">23329690</pub-id>
</mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kaufmann</surname> <given-names>K.</given-names></name>
<name><surname>Melzer</surname> <given-names>R.</given-names></name>
<name><surname>Theissen</surname> <given-names>G.</given-names></name>
</person-group> (<year>2005</year>). 
<article-title>MIKC-type MADS-domain proteins: structural modularity, protein interactions and network evolution in land plants</article-title>. <source>Gene</source> <volume>347</volume>, <fpage>183</fpage>&#x2013;<lpage>198</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.gene.2004.12.014</pub-id>, PMID: <pub-id pub-id-type="pmid">15777618</pub-id>
</mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Koenen</surname> <given-names>E. J. M.</given-names></name>
<name><surname>Ojeda</surname> <given-names>D. I.</given-names></name>
<name><surname>Bakker</surname> <given-names>F. T.</given-names></name>
<name><surname>Wieringa</surname> <given-names>J. J.</given-names></name>
<name><surname>Kidner</surname> <given-names>C.</given-names></name>
<name><surname>Hardy</surname> <given-names>O. J.</given-names></name>
<etal/>
</person-group>. (<year>2021</year>). 
<article-title>The origin of the legumes is a complex paleopolyploid phylogenomic tangle closely associated with the cretaceous-paleogene (K-pg) mass extinction event</article-title>. <source>Syst. Biol.</source> <volume>70</volume>, <fpage>508</fpage>&#x2013;<lpage>526</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/sysbio/syaa041</pub-id>, PMID: <pub-id pub-id-type="pmid">32483631</pub-id>
</mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Konrad</surname> <given-names>A.</given-names></name>
<name><surname>Teufel</surname> <given-names>A. I.</given-names></name>
<name><surname>Grahnen</surname> <given-names>J. A.</given-names></name>
<name><surname>Liberles</surname> <given-names>D. A.</given-names></name>
</person-group> (<year>2011</year>). 
<article-title>Toward a general model for the evolutionary dynamics of gene duplicates</article-title>. <source>Genome Biol. Evol.</source> <volume>3</volume>, <fpage>1197</fpage>&#x2013;<lpage>1209</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evr093</pub-id>, PMID: <pub-id pub-id-type="pmid">21920903</pub-id>
</mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kou</surname> <given-names>K.</given-names></name>
<name><surname>Yang</surname> <given-names>H.</given-names></name>
<name><surname>Li</surname> <given-names>H.</given-names></name>
<name><surname>Fang</surname> <given-names>C.</given-names></name>
<name><surname>Chen</surname> <given-names>L.</given-names></name>
<name><surname>Yue</surname> <given-names>L.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>A functionally divergent SOC1 homolog improves soybean yield and latitudinal adaptation</article-title>. <source>Curr. Biol.</source> <volume>32 (8), 1728&#x2013;1742</volume>, <fpage>e1726</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cub.2022.02.046</pub-id>, PMID: <pub-id pub-id-type="pmid">35263616</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kumar</surname> <given-names>S.</given-names></name>
<name><surname>Suleski</surname> <given-names>M.</given-names></name>
<name><surname>Craig</surname> <given-names>J. M.</given-names></name>
<name><surname>Kasprowicz</surname> <given-names>A. E.</given-names></name>
<name><surname>Sanderford</surname> <given-names>M.</given-names></name>
<name><surname>Li</surname> <given-names>M.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>TimeTree 5: an expanded resource for species divergence times</article-title>. <source>Mol. Biol. Evol</source>. <volume>39</volume> (<issue>8</issue>), <elocation-id>msac174</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msac174</pub-id>, PMID: <pub-id pub-id-type="pmid">35932227</pub-id>
</mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liang</surname> <given-names>H.</given-names></name>
<name><surname>Fernandez</surname> <given-names>A.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>Evolutionary constraints imposed by gene dosage balance</article-title>. <source>Front. Biosci.</source> <volume>13</volume>, <fpage>4373</fpage>&#x2013;<lpage>4378</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2741/3010</pub-id>, PMID: <pub-id pub-id-type="pmid">18508516</pub-id>
</mixed-citation>
</ref>
<ref id="B40">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>Z.</given-names></name>
<name><surname>Zhang</surname> <given-names>C.</given-names></name>
<name><surname>He</surname> <given-names>J.</given-names></name>
<name><surname>Li</surname> <given-names>C.</given-names></name>
<name><surname>Fu</surname> <given-names>Y.</given-names></name>
<name><surname>Zhou</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>plantGIR: a genomic database of plants</article-title>. <source>Hortic. Res.</source> <volume>11</volume>, <elocation-id>uhae342</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/hr/uhae342</pub-id>, PMID: <pub-id pub-id-type="pmid">39712867</pub-id>
</mixed-citation>
</ref>
<ref id="B41">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>C.</given-names></name>
<name><surname>Zhang</surname> <given-names>J.</given-names></name>
<name><surname>Zhang</surname> <given-names>N.</given-names></name>
<name><surname>Shan</surname> <given-names>H.</given-names></name>
<name><surname>Su</surname> <given-names>K.</given-names></name>
<name><surname>Zhang</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2010</year>). 
<article-title>Interactions among proteins of floral MADS-box genes in basal eudicots: implications for evolution of the regulatory network for flower development</article-title>. <source>Mol. Biol. Evol.</source> <volume>27</volume>, <fpage>1598</fpage>&#x2013;<lpage>1611</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msq044</pub-id>, PMID: <pub-id pub-id-type="pmid">20147438</pub-id>
</mixed-citation>
</ref>
<ref id="B42">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Livak</surname> <given-names>K. J.</given-names></name>
<name><surname>Schmittgen</surname> <given-names>T. D.</given-names></name>
</person-group> (<year>2001</year>). 
<article-title>Analysis of relative gene expression data using real-time quantitative PCR and the 2(-Delta Delta C(T)) Method</article-title>. <source>Methods</source> <volume>25</volume>, <fpage>402</fpage>&#x2013;<lpage>408</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1006/meth.2001.1262</pub-id>, PMID: <pub-id pub-id-type="pmid">11846609</pub-id>
</mixed-citation>
</ref>
<ref id="B43">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Magadum</surname> <given-names>S.</given-names></name>
<name><surname>Banerjee</surname> <given-names>U.</given-names></name>
<name><surname>Murugan</surname> <given-names>P.</given-names></name>
<name><surname>Gangapur</surname> <given-names>D.</given-names></name>
<name><surname>Ravikesavan</surname> <given-names>R.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Gene duplication as a major force in evolution</article-title>. <source>J. Genet.</source> <volume>92</volume>, <fpage>155</fpage>&#x2013;<lpage>161</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12041-013-0212-8</pub-id>, PMID: <pub-id pub-id-type="pmid">23640422</pub-id>
</mixed-citation>
</ref>
<ref id="B44">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Manzoor</surname> <given-names>M. A.</given-names></name>
<name><surname>Xu</surname> <given-names>Y.</given-names></name>
<name><surname>Lv</surname> <given-names>Z.</given-names></name>
<name><surname>Xu</surname> <given-names>J.</given-names></name>
<name><surname>Wang</surname> <given-names>Y.</given-names></name>
<name><surname>Sun</surname> <given-names>W.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Comparative genomics of N-acetyl-5-methoxytryptamine members in four Prunus species with insights into bud dormancy and abiotic stress responses in Prunus avium</article-title>. <source>Plant Cell Rep.</source> <volume>43</volume>, <fpage>89</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00299-024-03184-0</pub-id>, PMID: <pub-id pub-id-type="pmid">38462577</pub-id>
</mixed-citation>
</ref>
<ref id="B45">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mascagni</surname> <given-names>F.</given-names></name>
<name><surname>Usai</surname> <given-names>G.</given-names></name>
<name><surname>Cavallini</surname> <given-names>A.</given-names></name>
<name><surname>Porceddu</surname> <given-names>A</given-names></name>
</person-group>. (<year>2021</year>). 
<article-title>Structural characterization and duplication modes of pseudogenes in plants</article-title>. <source>Sci Rep</source>. <volume>11</volume>(<issue>1</issue>), <elocation-id>5292</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-021-84778-6</pub-id>, PMID: <pub-id pub-id-type="pmid">33674668</pub-id>
</mixed-citation>
</ref>
<ref id="B46">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Melzer</surname> <given-names>R.</given-names></name>
<name><surname>Theissen</surname> <given-names>G.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>Reconstitution of &#x2018;floral quartets&#x2019; <italic>in vitro</italic> involving class B and class E floral homeotic proteins</article-title>. <source>Nucleic Acids Res.</source> <volume>37</volume>, <fpage>2723</fpage>&#x2013;<lpage>2736</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkp129</pub-id>, PMID: <pub-id pub-id-type="pmid">19276203</pub-id>
</mixed-citation>
</ref>
<ref id="B47">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mora-Garcia</surname> <given-names>S.</given-names></name>
<name><surname>Goodrich</surname> <given-names>J</given-names></name>
</person-group>. (<year>2000</year>). 
<article-title>Genomic imprinting: Seeds of conflict</article-title>. <source>Current Biol</source>. <volume>10 </volume>(<issue>2</issue>), <fpage>R71</fpage>&#x2013;<lpage>4</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/s0960-9822(00)00285-2</pub-id>, PMID: <pub-id pub-id-type="pmid">10722305</pub-id>
</mixed-citation>
</ref>
<ref id="B48">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Nam</surname> <given-names>J.</given-names></name>
<name><surname>Kim</surname> <given-names>J.</given-names></name>
<name><surname>Lee</surname> <given-names>S.</given-names></name>
<name><surname>An</surname> <given-names>G.</given-names></name>
<name><surname>Ma</surname> <given-names>H.</given-names></name>
<name><surname>Nei</surname> <given-names>M.</given-names></name>
</person-group> (<year>2004</year>). 
<article-title>Type I MADS-box genes have experienced faster birth-and-death evolution than type II MADS-box genes in angiosperms</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>101</volume>, <fpage>1910</fpage>&#x2013;<lpage>1915</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0308430100</pub-id>, PMID: <pub-id pub-id-type="pmid">14764899</pub-id>
</mixed-citation>
</ref>
<ref id="B49">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ng</surname> <given-names>M.</given-names></name>
<name><surname>Yanofsky</surname> <given-names>M. F.</given-names></name>
</person-group> (<year>2001</year>). 
<article-title>Function and evolution of the plant MADS-box gene family</article-title>. <source>Nat. Rev. Genet.</source> <volume>2</volume>, <fpage>186</fpage>&#x2013;<lpage>195</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/35056041</pub-id>, PMID: <pub-id pub-id-type="pmid">11256070</pub-id>
</mixed-citation>
</ref>
<ref id="B50">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Parenicov&#xe1;</surname> <given-names>L.</given-names></name>
<name><surname>de Folter</surname> <given-names>S.</given-names></name>
<name><surname>Kieffer</surname> <given-names>M.</given-names></name>
<name><surname>Horner</surname> <given-names>D. S.</given-names></name>
<name><surname>Favalli</surname> <given-names>C.</given-names></name>
<name><surname>Busscher</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2003</year>). 
<article-title>Molecular and phylogenetic analyses of the complete MADS-box transcription factor family in Arabidopsis: new openings to the MADS world</article-title>. <source>Plant Cell</source> <volume>15</volume>, <fpage>1538</fpage>&#x2013;<lpage>1551</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1105/tpc.011544</pub-id>, PMID: <pub-id pub-id-type="pmid">12837945</pub-id>
</mixed-citation>
</ref>
<ref id="B51">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Potter</surname> <given-names>S. C.</given-names></name>
<name><surname>Luciani</surname> <given-names>A.</given-names></name>
<name><surname>Eddy</surname> <given-names>S. R.</given-names></name>
<name><surname>Park</surname> <given-names>Y.</given-names></name>
<name><surname>Lopez</surname> <given-names>R.</given-names></name>
<name><surname>Finn</surname> <given-names>R. D.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>HMMER web server: 2018 update</article-title>. <source>Nucleic Acids Res.</source> <volume>46</volume>, <fpage>W200</fpage>&#x2013;<lpage>w204</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gky448</pub-id>, PMID: <pub-id pub-id-type="pmid">29905871</pub-id>
</mixed-citation>
</ref>
<ref id="B52">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Price</surname> <given-names>M. N.</given-names></name>
<name><surname>Dehal</surname> <given-names>P. S.</given-names></name>
<name><surname>Arkin</surname> <given-names>A. P</given-names></name>
</person-group>. (<year>2009</year>). 
<article-title>FastTree: computing large minimum evolution trees with profiles instead of a distance matrix</article-title>. <source>Mol. Biol. Evol</source>. <volume>26</volume>(<issue>7</issue>), <fpage>1641</fpage>&#x2013;<lpage>1650</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msp077</pub-id>, PMID: <pub-id pub-id-type="pmid">19377059</pub-id>
</mixed-citation>
</ref>
<ref id="B53">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Qian</surname> <given-names>W.</given-names></name>
<name><surname>Zhang</surname> <given-names>J.</given-names></name>
</person-group> (<year>2014</year>). 
<article-title>Genomic evidence for adaptation by gene duplication</article-title>. <source>Genome Res.</source> <volume>24</volume>, <fpage>1356</fpage>&#x2013;<lpage>1362</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.172098.114</pub-id>, PMID: <pub-id pub-id-type="pmid">24904045</pub-id>
</mixed-citation>
</ref>
<ref id="B54">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Qiao</surname> <given-names>X.</given-names></name>
<name><surname>Li</surname> <given-names>Q.</given-names></name>
<name><surname>Yin</surname> <given-names>H.</given-names></name>
<name><surname>Qi</surname> <given-names>K.</given-names></name>
<name><surname>Li</surname> <given-names>L.</given-names></name>
<name><surname>Wang</surname> <given-names>R.</given-names></name>
<etal/>
</person-group>. (<year>2019</year>). 
<article-title>Gene duplication and evolution in recurring polyploidization-diploidization cycles in plants</article-title>. <source>Genome Biol.</source> <volume>20</volume>, <fpage>38</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-019-1650-2</pub-id>, PMID: <pub-id pub-id-type="pmid">30791939</pub-id>
</mixed-citation>
</ref>
<ref id="B55">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Quesada-Traver</surname> <given-names>C.</given-names></name>
<name><surname>Lloret</surname> <given-names>A.</given-names></name>
<name><surname>Carretero-Paulet</surname> <given-names>L.</given-names></name>
<name><surname>Badenes</surname> <given-names>M. L.</given-names></name>
<name><surname>Rios</surname> <given-names>G.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Evolutionary origin and functional specialization of Dormancy-Associated MADS box (DAM) proteins in perennial crops</article-title>. <source>BMC Plant Biol.</source> <volume>22</volume>, <fpage>473</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12870-022-03856-7</pub-id>, PMID: <pub-id pub-id-type="pmid">36199018</pub-id>
</mixed-citation>
</ref>
<ref id="B56">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ren</surname> <given-names>R.</given-names></name>
<name><surname>Wang</surname> <given-names>H.</given-names></name>
<name><surname>Guo</surname> <given-names>C.</given-names></name>
<name><surname>Zhang</surname> <given-names>N.</given-names></name>
<name><surname>Zeng</surname> <given-names>L.</given-names></name>
<name><surname>Chen</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2018</year>). 
<article-title>Widespread whole genome duplications contribute to genome complexity and species diversity in angiosperms</article-title>. <source>Mol. Plant</source> <volume>11</volume>, <fpage>414</fpage>&#x2013;<lpage>428</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.molp.2018.01.002</pub-id>, PMID: <pub-id pub-id-type="pmid">29317285</pub-id>
</mixed-citation>
</ref>
<ref id="B57">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shen</surname> <given-names>G.</given-names></name>
<name><surname>Jia</surname> <given-names>Y.</given-names></name>
<name><surname>Wang</surname> <given-names>W. L.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Evolutionary divergence of motifs in B-class MADS-box proteins of seed plants</article-title>. <source>J. Biol. Res. (Thessalon)</source> <volume>28</volume>, <fpage>12</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s40709-021-00144-7</pub-id>, PMID: <pub-id pub-id-type="pmid">34049600</pub-id>
</mixed-citation>
</ref>
<ref id="B58">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sheng</surname> <given-names>X. G.</given-names></name>
<name><surname>Zhao</surname> <given-names>Z. Q.</given-names></name>
<name><surname>Wang</surname> <given-names>J. S.</given-names></name>
<name><surname>Yu</surname> <given-names>H. F.</given-names></name>
<name><surname>Shen</surname> <given-names>Y. S.</given-names></name>
<name><surname>Zeng</surname> <given-names>X. Y.</given-names></name>
<etal/>
</person-group>. (<year>2019</year>). 
<article-title>Genome wide analysis of MADS-box gene family in Brassica oleracea reveals conservation and variation in flower development</article-title>. <source>BMC Plant Biol.</source> <volume>19</volume>, <fpage>106</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12870-019-1717-y</pub-id>, PMID: <pub-id pub-id-type="pmid">30890145</pub-id>
</mixed-citation>
</ref>
<ref id="B59">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shi</surname> <given-names>X.</given-names></name>
<name><surname>Chen</surname> <given-names>C.</given-names></name>
<name><surname>Yang</surname> <given-names>H.</given-names></name>
<name><surname>Hou</surname> <given-names>J.</given-names></name>
<name><surname>Ji</surname> <given-names>T.</given-names></name>
<name><surname>Cheng</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>The gene balance hypothesis: epigenetics and dosage effects in plants</article-title>. <source>Methods Mol. Biol.</source>, <volume>2093</volume>, <fpage>161</fpage>&#x2013;<lpage>171</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-1-0716-0179-2_12</pub-id>, PMID: <pub-id pub-id-type="pmid">32088896</pub-id>
</mixed-citation>
</ref>
<ref id="B60">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shimizu</surname> <given-names>K. K.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Robustness and the generalist niche of polyploid species: Genome shock or gradual evolution</article-title>? <source>Curr. Opin. Plant Biol.</source> <volume>69</volume>, <elocation-id>102292</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pbi.2022.102292</pub-id>, PMID: <pub-id pub-id-type="pmid">36063635</pub-id>
</mixed-citation>
</ref>
<ref id="B61">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shu</surname> <given-names>Y.</given-names></name>
<name><surname>Yu</surname> <given-names>D.</given-names></name>
<name><surname>Wang</surname> <given-names>D.</given-names></name>
<name><surname>Guo</surname> <given-names>D.</given-names></name>
<name><surname>Guo</surname> <given-names>C.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Genome-wide survey and expression analysis of the MADS-box gene family in soybean</article-title>. <source>Mol. Biol. Rep.</source> <volume>40</volume>, <fpage>3901</fpage>&#x2013;<lpage>3911</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11033-012-2438-6</pub-id>, PMID: <pub-id pub-id-type="pmid">23559340</pub-id>
</mixed-citation>
</ref>
<ref id="B62">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Soltis</surname> <given-names>P. S.</given-names></name>
<name><surname>Marchant</surname> <given-names>D. B.</given-names></name>
<name><surname>Van de Peer</surname> <given-names>Y.</given-names></name>
<name><surname>Soltis</surname> <given-names>D. E.</given-names></name>
</person-group> (<year>2015</year>). 
<article-title>Polyploidy and genome evolution in plants</article-title>. <source>Curr. Opin. Genet. Dev.</source> <volume>35</volume>, <fpage>119</fpage>&#x2013;<lpage>125</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.gde.2015.11.003</pub-id>, PMID: <pub-id pub-id-type="pmid">26656231</pub-id>
</mixed-citation>
</ref>
<ref id="B63">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Subramanian</surname> <given-names>B.</given-names></name>
<name><surname>Gao</surname> <given-names>S.</given-names></name>
<name><surname>Lercher</surname> <given-names>M. J.</given-names></name>
<name><surname>Hu</surname> <given-names>S.</given-names></name>
<name><surname>Chen</surname> <given-names>W. H.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Evolview v3: a webserver for visualization, annotation, and management of phylogenetic trees</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume>, <fpage>W270</fpage>&#x2013;<lpage>w275</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkz357</pub-id>, PMID: <pub-id pub-id-type="pmid">31114888</pub-id>
</mixed-citation>
</ref>
<ref id="B64">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Thangavel</surname> <given-names>G.</given-names></name>
<name><surname>Nayar</surname> <given-names>S.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>A survey of MIKC type MADS-box genes in non-seed plants: algae, bryophytes, lycophytes and ferns</article-title>. <source>Front. Plant Sci.</source> <volume>9</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2018.00510</pub-id>, PMID: <pub-id pub-id-type="pmid">29720991</pub-id>
</mixed-citation>
</ref>
<ref id="B65">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Tong</surname> <given-names>C.</given-names></name>
<name><surname>Jia</surname> <given-names>Y.</given-names></name>
<name><surname>Hu</surname> <given-names>H.</given-names></name>
<name><surname>Zeng</surname> <given-names>Z.</given-names></name>
<name><surname>Chapman</surname> <given-names>B.</given-names></name>
<name><surname>Li</surname> <given-names>C.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>Pangenome and pantranscriptome as the new reference for gene-family characterization: A case study of basic helix-loop-helix (bHLH) genes in barley</article-title>. <source>Plant Commun.</source> <volume>6</volume>, <elocation-id>101190</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.xplc.2024.101190</pub-id>, PMID: <pub-id pub-id-type="pmid">39521956</pub-id>
</mixed-citation>
</ref>
<ref id="B66">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Vanneste</surname> <given-names>K.</given-names></name>
<name><surname>Maere</surname> <given-names>S.</given-names></name>
<name><surname>Van de Peer</surname> <given-names>Y.</given-names></name>
</person-group> (<year>2014</year>). 
<article-title>Tangled up in two: a burst of genome duplications at the end of the Cretaceous and the consequences for plant evolution</article-title>. <source>Philos. Trans. R Soc. Lond B Biol. Sci.</source> <volume>369</volume>, <fpage>20130353</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1098/rstb.2013.0353</pub-id>, PMID: <pub-id pub-id-type="pmid">24958926</pub-id>
</mixed-citation>
</ref>
<ref id="B67">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>Y.</given-names></name>
<name><surname>Tang</surname> <given-names>H.</given-names></name>
<name><surname>Debarry</surname> <given-names>J. D.</given-names></name>
<name><surname>Tan</surname> <given-names>X.</given-names></name>
<name><surname>Li</surname> <given-names>J.</given-names></name>
<name><surname>Wang</surname> <given-names>X.</given-names></name>
<etal/>
</person-group>. (<year>2012</year>). 
<article-title>MCScanX: a toolkit for detection and evolutionary analysis of gene synteny and collinearity</article-title>. <source>Nucleic Acids Res.</source> <volume>40</volume>, <fpage>e49</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkr1293</pub-id>, PMID: <pub-id pub-id-type="pmid">22217600</pub-id>
</mixed-citation>
</ref>
<ref id="B68">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wei</surname> <given-names>J.</given-names></name>
<name><surname>Zhang</surname> <given-names>G.</given-names></name>
<name><surname>Lv</surname> <given-names>H.</given-names></name>
<name><surname>Wang</surname> <given-names>S.</given-names></name>
<name><surname>Liu</surname> <given-names>X.</given-names></name>
<name><surname>Qi</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Genome-wide identification of the P4ATPase gene family and its response to biotic and abiotic stress in soybean (Glycine max L.)</article-title>. <source>BMC Genomics</source> <volume>26</volume>, <fpage>277</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12864-025-11468-2</pub-id>, PMID: <pub-id pub-id-type="pmid">40114086</pub-id>
</mixed-citation>
</ref>
<ref id="B69">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wilson</surname> <given-names>A. E.</given-names></name>
<name><surname>Liberles</surname> <given-names>D. A.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Expectations of duplicate gene retention under the gene duplicability hypothesis</article-title>. <source>BMC Ecol. Evol.</source> <volume>23</volume>, <fpage>76</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12862-023-02174-2</pub-id>, PMID: <pub-id pub-id-type="pmid">38097959</pub-id>
</mixed-citation>
</ref>
<ref id="B70">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Xue</surname> <given-names>C.</given-names></name>
<name><surname>Fu</surname> <given-names>Y.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>Preservation of duplicate genes by originalization</article-title>. <source>Genetica</source> <volume>136</volume>, <fpage>69</fpage>&#x2013;<lpage>78</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10709-008-9311-5</pub-id>, PMID: <pub-id pub-id-type="pmid">18726163</pub-id>
</mixed-citation>
</ref>
<ref id="B71">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ye</surname> <given-names>L. X.</given-names></name>
<name><surname>Zhang</surname> <given-names>J. X.</given-names></name>
<name><surname>Hou</surname> <given-names>X. J.</given-names></name>
<name><surname>Qiu</surname> <given-names>M. Q.</given-names></name>
<name><surname>Wang</surname> <given-names>W. F.</given-names></name>
<name><surname>Zhang</surname> <given-names>J. X.</given-names></name>
<etal/>
</person-group>. (<year>2021</year>). 
<article-title>A MADS-box gene ciMADS43 is involved in citrus flowering and leaf development through interaction with ciAGL9</article-title>. <source>Int. J. Mol. Sci.</source> <volume>22</volume>, <fpage>5205</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms22105205</pub-id>, PMID: <pub-id pub-id-type="pmid">34069068</pub-id>
</mixed-citation>
</ref>
<ref id="B72">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yu</surname> <given-names>Z.</given-names></name>
<name><surname>Lei</surname> <given-names>T.</given-names></name>
<name><surname>Yi</surname> <given-names>X.</given-names></name>
<name><surname>Hao</surname> <given-names>Y.</given-names></name>
<name><surname>Wu</surname> <given-names>S.</given-names></name>
<name><surname>Xiao</surname> <given-names>Z.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>LGRPv2: A high-value platform for the advancement of Fabaceae genomics</article-title>. <source>Plant Biotechnol. J</source>. <volume>23</volume>, <fpage>4057</fpage>&#x2013;<lpage>4075</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pbi.70220</pub-id>, PMID: <pub-id pub-id-type="pmid">40545607</pub-id>
</mixed-citation>
</ref>
<ref id="B73">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yu</surname> <given-names>Y.</given-names></name>
<name><surname>Zhang</surname> <given-names>H.</given-names></name>
<name><surname>Long</surname> <given-names>Y.</given-names></name>
<name><surname>Shu</surname> <given-names>Y.</given-names></name>
<name><surname>Zhai</surname> <given-names>J.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Plant Public RNA-seq Database: a comprehensive online database for expression analysis of ~45&#x2013;000 plant public RNA-Seq libraries</article-title>. <source>Plant Biotechnol. J.</source> <volume>20</volume>, <fpage>806</fpage>&#x2013;<lpage>808</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pbi.13798</pub-id>, PMID: <pub-id pub-id-type="pmid">35218297</pub-id>
</mixed-citation>
</ref>
<ref id="B74">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>L.</given-names></name>
<name><surname>Chen</surname> <given-names>F.</given-names></name>
<name><surname>Zhang</surname> <given-names>X.</given-names></name>
<name><surname>Li</surname> <given-names>Z.</given-names></name>
<name><surname>Zhao</surname> <given-names>Y.</given-names></name>
<name><surname>Lohaus</surname> <given-names>R.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>The water lily genome and the early evolution of flowering plants</article-title>. <source>Nature</source> <volume>577</volume>, <fpage>79</fpage>&#x2013;<lpage>84</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41586-019-1852-5</pub-id>, PMID: <pub-id pub-id-type="pmid">31853069</pub-id>
</mixed-citation>
</ref>
<ref id="B75">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhao</surname> <given-names>D.</given-names></name>
<name><surname>Chen</surname> <given-names>Z.</given-names></name>
<name><surname>Xu</surname> <given-names>L.</given-names></name>
<name><surname>Zhang</surname> <given-names>L.</given-names></name>
<name><surname>Zou</surname> <given-names>Q.</given-names></name>
</person-group> (<year>2021</year>a). 
<article-title>Genome-wide analysis of the MADS-box gene family in maize: gene structure, evolution, and relationships</article-title>. <source>Genes (Basel)</source> <volume>12</volume>, <fpage>1956</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/genes12121956</pub-id>, PMID: <pub-id pub-id-type="pmid">34946905</pub-id>
</mixed-citation>
</ref>
<ref id="B76">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhao</surname> <given-names>N.</given-names></name>
<name><surname>Ding</surname> <given-names>X.</given-names></name>
<name><surname>Lian</surname> <given-names>T.</given-names></name>
<name><surname>Wang</surname> <given-names>M.</given-names></name>
<name><surname>Tong</surname> <given-names>Y.</given-names></name>
<name><surname>Liang</surname> <given-names>D.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>The effects of gene duplication modes on the evolution of regulatory divergence in wild and cultivated soybean</article-title>. <source>Front. Genet.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fgene.2020.601003</pub-id>, PMID: <pub-id pub-id-type="pmid">33363574</pub-id>
</mixed-citation>
</ref>
<ref id="B77">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhao</surname> <given-names>J.</given-names></name>
<name><surname>Teufel</surname> <given-names>A. I.</given-names></name>
<name><surname>Liberles</surname> <given-names>D. A.</given-names></name>
<name><surname>Liu</surname> <given-names>L.</given-names></name>
</person-group> (<year>2015</year>). 
<article-title>A generalized birth and death process for modeling the fates of gene duplication</article-title>. <source>BMC Evol. Biol.</source> <volume>15</volume>, <fpage>275</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12862-015-0539-2</pub-id>, PMID: <pub-id pub-id-type="pmid">26643106</pub-id>
</mixed-citation>
</ref>
<ref id="B78">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhao</surname> <given-names>Y.</given-names></name>
<name><surname>Zhang</surname> <given-names>R.</given-names></name>
<name><surname>Jiang</surname> <given-names>K.-W.</given-names></name>
<name><surname>Qi</surname> <given-names>J.</given-names></name>
<name><surname>Hu</surname> <given-names>Y.</given-names></name>
<name><surname>Guo</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2021</year>b). 
<article-title>Nuclear phylotranscriptomics and phylogenomics support numerous polyploidization events and hypotheses for the evolution of rhizobial nitrogen-fixing symbiosis in Fabaceae</article-title>. <source>Mol. Plant</source> <volume>14</volume>, <fpage>748</fpage>&#x2013;<lpage>773</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.molp.2021.02.006</pub-id>, PMID: <pub-id pub-id-type="pmid">33631421</pub-id>
</mixed-citation>
</ref>
<ref id="B79">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhu</surname> <given-names>Y.</given-names></name>
<name><surname>Lin</surname> <given-names>Z.</given-names></name>
<name><surname>Nakhleh</surname> <given-names>L.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Evolution after whole-genome duplication: a network perspective</article-title>. <source>G3 (Bethesda)</source> <volume>3</volume>, <fpage>2049</fpage>&#x2013;<lpage>2057</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1534/g3.113.008458</pub-id>, PMID: <pub-id pub-id-type="pmid">24048644</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/653566">Xuming Li</ext-link>, Hugo Biotechnologies Co., Ltd., China</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1990470">Hong Zhai</ext-link>, Chinese Academy of Sciences (CAS), China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3271471">Tiantian Bu</ext-link>, Henan University, China</p></fn>
</fn-group>
</back>
</article>