<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2023.1198909</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Phylogenomic analysis provides insights into <italic>MADS-box</italic> and <italic>TCP</italic> gene diversification and floral development of the Asteraceae, supported by <italic>de novo</italic> genome and transcriptome sequences from dandelion (<italic>Taraxacum officinale</italic>)</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Xiong</surname>
<given-names>Wei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn004">
<sup>&#x2021;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2269081"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Risse</surname>
<given-names>Judith</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn004">
<sup>&#x2021;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Berke</surname>
<given-names>Lidija</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhao</surname>
<given-names>Tao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1794929"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>van de Geest</surname>
<given-names>Henri</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Oplaat</surname>
<given-names>Carla</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Busscher</surname>
<given-names>Marco</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ferreira de Carvalho</surname>
<given-names>Julie</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>van der Meer</surname>
<given-names>Ingrid M.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/197629"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Verhoeven</surname>
<given-names>Koen J. F.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/43165"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Schranz</surname>
<given-names>M. Eric</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<xref ref-type="author-notes" rid="fn005">
<sup>&#xa7;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/190885"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Vijverberg</surname>
<given-names>Kitty</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<xref ref-type="author-notes" rid="fn005">
<sup>&#xa7;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/588224"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Biosystematics Group, Wageningen University and Research</institution>, <addr-line>Wageningen</addr-line>, <country>Netherlands</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Bioinformatics Group, Wageningen University and Research</institution>, <addr-line>Wageningen</addr-line>, <country>Netherlands</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Terrestrial Ecology, Netherlands Institute of Ecology (NIOO-KNAW)</institution>, <addr-line>Wageningen</addr-line>, <country>Netherlands</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Bioscience, Wageningen University and Research</institution>, <addr-line>Wageningen</addr-line>, <country>Netherlands</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Stefan de Folter, Center for Research and Advanced Studies (CINVESTAV), Mexico</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Zhichao Xu, Northeast Forestry University, China; Qing Ma, Zhejiang Shuren University, China</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Kitty Vijverberg, <email xlink:href="mailto:mail@kittyvijverberg.nl">mail@kittyvijverberg.nl</email>;  M. Eric Schranz, <email xlink:href="mailto:eric.schranz@wur.nl">eric.schranz@wur.nl</email>
</p>
</fn>
<fn fn-type="present-address" id="fn003">
<p>&#x2020;Present address: Lidija Berke, Bioinformatics &amp; Software Development, Genetwister Technologies B.V., Wageningen, Netherlands; Tao Zhao, State Key Laboratory of Crop Stress Biology for Arid Areas, Northwest A&amp;F University, Yangling, Shaanxi, China; Henri van de Geest, Hudson River Biotechnology, Wageningen, Netherlands; Carla Oplaat, Netherlands Institute for Vectors, Invasive Plants and Plant Health (NIVIP) Netherlands Food and Consumer Product Safety Authority (NVWA), Wageningen, Netherlands; Julie Ferreira de Carvalho, Institute of Research in Horticulture and Seeds (IRHS), University of Angers/French National Research Institute for Agriculture, Food and Environment (INRAE)/Agro Institute, Angers, France; Kitty Vijverberg, Plant Trait Biology, Rijk Zwaan Breeding BV, Fijnaart, Netherlands</p>
</fn>
<fn fn-type="other" id="fn004">
<p>&#x2021;These authors share first authorship</p>
</fn>
<fn fn-type="other" id="fn005">
<p>&#xa7;These authors share last authorship</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>21</day>
<month>06</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1198909</elocation-id>
<history>
<date date-type="received">
<day>02</day>
<month>04</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>26</day>
<month>05</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Xiong, Risse, Berke, Zhao, van de Geest, Oplaat, Busscher, Ferreira de Carvalho, van der Meer, Verhoeven, Schranz and Vijverberg</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Xiong, Risse, Berke, Zhao, van de Geest, Oplaat, Busscher, Ferreira de Carvalho, van der Meer, Verhoeven, Schranz and Vijverberg</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The Asteraceae is the largest angiosperm family with more than 25,000 species. Individual studies have shown that <italic>MADS-box</italic> and <italic>TCP</italic> transcription factors are regulators of the development and symmetry of flowers, contributing to their iconic flower-head (capitulum) and floret. However, a systematic study of <italic>MADS-box</italic> and <italic>TCP</italic> genes across the Asteraceae is lacking. We performed a comparative analysis of genome sequences of 33 angiosperm species including our <italic>de novo</italic> assembly of diploid sexual dandelion (<italic>Taraxacum officinale</italic>) and 11 other Asteraceae to investigate the lineage-specific evolution of <italic>MADS-box</italic> and <italic>TCP</italic> genes in the Asteraceae. We compared the phylogenomic results of <italic>MADS-box</italic> and <italic>TCP</italic> genes with their expression in <italic>T. officinale</italic> floral tissues at different developmental stages to demonstrate the regulation of genes with Asteraceae-specific attributes. Here, we show that <italic>MADS-box MIKC</italic>
<sup>c</sup> and <italic>TCP-CYCLOIDEA</italic> (<italic>CYC</italic>) genes have expanded in the Asteraceae. The phylogenomic analysis identified <italic>AGAMOUS</italic>-like (<italic>AG</italic>-like: <italic>SEEDSTICK</italic> [<italic>STK</italic>]-like), <italic>SEPALATA</italic>-like (<italic>SEP</italic>3-like), and <italic>TCP-PROLIFERATING CELL FACTOR</italic> (<italic>PCF</italic>)-like copies with lineage-specific genomic contexts in the Asteraceae, Cichorioideae, or dandelion. Different expression patterns of some of these gene copies suggest functional divergence. We also confirm the presence and revisit the evolutionary history of previously named &#x201c;<italic>Asteraceae-Specific MADS-box</italic> genes (<italic>AS-MADS</italic>).&#x201d; Specifically, we identify non-Asteraceae homologs, indicating a more ancient origin of this gene clade. Syntenic relationships support that <italic>AS-MADS</italic> is paralogous to <italic>FLOWERING LOCUS C</italic> (<italic>FLC</italic>) as demonstrated by the shared ancient duplication of <italic>FLC</italic> and <italic>SEP</italic>3.</p>
</abstract>
<kwd-group>
<kwd>Asteraceae</kwd>
<kwd>dandelion</kwd>
<kwd>
<italic>de novo</italic> sequencing</kwd>
<kwd>floral development</kwd>
<kwd>
<italic>MADS-box</italic> gene</kwd>
<kwd>phylogenomics</kwd>
<kwd>
<italic>TCP</italic> gene</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="107"/>
<page-count count="20"/>
<word-count count="13188"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Plant Development and EvoDevo</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>The Asteraceae (Compositae) is the largest and most diverse families of angiosperms, with great ecological and economic importance. It contains ~25,000 species, which represents 10% of extant flowering plants (<xref ref-type="bibr" rid="B53">Mandel et&#xa0;al., 2019</xref>). The Asteraceae is subdivided into 16 subfamilies including two large crown-groups, the Asteroideae (e.g., sunflower and daisy) and Cichorioideae (e.g., lettuce and dandelion) (<xref ref-type="bibr" rid="B14">Chase et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B82">Stevens, 2017</xref>; <xref ref-type="bibr" rid="B84">Susanna et&#xa0;al., 2020</xref>). Members of the Asteraceae inhabit an incredible range of ecosystems varying in climates and landscapes on every continent (<xref ref-type="bibr" rid="B80">Smith and Richardson, 2010</xref>; <xref ref-type="bibr" rid="B27">Folk et&#xa0;al., 2020</xref>). Their global distribution makes them interesting targets to study various questions in ecology and evolution (<xref ref-type="bibr" rid="B77">Shen et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B63">Palazzesi et&#xa0;al., 2022</xref>). For humans, the Asteraceae is of considerable societal and economic value as ornamentals (e.g., <italic>Gerbera</italic> and <italic>Chrysanthemum</italic>), medicines (e.g., sweet wormwood and chamomile), and crops (e.g., sunflower and lettuce), including many well-known weedy species (e.g., groundsel and dandelion). Genome assemblies can facilitate the study of the molecular and evolutionary bases of ecological and economic traits. To date, most sequenced Asteraceae species are ornamentals and crops.</p>
<p>The unique floral and fruit traits of the Asteraceae, including the representative flower heads (capitula) and one-seeded dry fruits (cypsela) often with a hairy or scaly pappus, underlie much of the diversity and evolutionary and ecological success of the group (<xref ref-type="bibr" rid="B65">Panero and Funk, 2008</xref>; <xref ref-type="bibr" rid="B53">Mandel et&#xa0;al., 2019</xref>). The capitulum is one of the most iconic floral features of the Asteraceae, a highly compressed inflorescence with many closely packed flowers, named &#x201c;florets&#x201d;, that together resemble a flower (<xref ref-type="bibr" rid="B24">Elomaa et&#xa0;al., 2018</xref>). There are three major floret types in Asteraceae&#x2014;disc (tube), ray (two- three-lobed), and ligulate (five-lobed) (<xref ref-type="bibr" rid="B2">Anderberg et&#xa0;al., 2007</xref>)&#x2014;which are discriminatory to the subfamilies, particularly the Asteroideae, characterized by disc florets &#xb1; one or more rows of ray florets, and the Cichorioideae, characterized by ligulate florets (<xref ref-type="bibr" rid="B11">Carlquist, 1976</xref>). In addition, the pappus, a highly modified calyx (<xref ref-type="bibr" rid="B99">Vijverberg et&#xa0;al., 2021</xref>), is another striking characteristic of the Asteraceae. It assists in seed dispersal and can protect against herbivores and aid in water uptake to facilitate germination (<xref ref-type="bibr" rid="B11">Carlquist, 1976</xref>; <xref ref-type="bibr" rid="B83">Stuessy and Garver, 1996</xref>; <xref ref-type="bibr" rid="B35">Jana and Mukherjee, 2012</xref>). Understanding the genetic basis of capitulum formation and floral and fruit characteristics is, therefore, of large interest to understanding the evolutionary success of the Asteraceae.</p>
<p>Whole-genome duplications (WGDs) have likely played a critical role in boosting the diversity of the Asteraceae (<xref ref-type="bibr" rid="B3">Barker et&#xa0;al., 2008</xref>), similar to other angiosperm lineages (<xref ref-type="bibr" rid="B62">Ohno, 1970</xref>; <xref ref-type="bibr" rid="B17">De Bodt et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B52">Magadum et&#xa0;al., 2013</xref>). In the Asteraceae, two paleopolyploid events occurred preceding their major radiation (<xref ref-type="bibr" rid="B4">Barker et&#xa0;al., 2016</xref>), and more recent WGDs occurred in major tribes and subfamilies (<xref ref-type="bibr" rid="B32">Huang et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B77">Shen et&#xa0;al., 2021</xref>). After WGDs, the additional gene copies may retain their original function (redundant copies) or undergo sub- and/or neo-functionalization (<xref ref-type="bibr" rid="B64">Panchy et&#xa0;al., 2016</xref>). Moreover, genes in a new genomic context (i.e., gene transposition) may result in a novel (<italic>cis</italic>) gene regulation (<xref ref-type="bibr" rid="B33">Ilic et&#xa0;al., 2003</xref>; <xref ref-type="bibr" rid="B43">Langham et&#xa0;al., 2004</xref>; <xref ref-type="bibr" rid="B49">Lockton and Gaut, 2005</xref>). Among the most important regulators of floral organ determination and development are the <italic>MADS-box</italic> and <italic>TCP</italic> transcription factors. Polyploidization has resulted in expanded <italic>MADS-box</italic> and <italic>TCP</italic> gene families. These expansions have been shown to contribute to the evolution of the capitulum, floral and fruit characteristics in the Asteraceae in different studies (see below).</p>
<p>In this study, we further examine <italic>MADS-box</italic> and <italic>TCP</italic> gene families to study their evolution, genomic context, and expression. The <italic>MADS-box</italic> gene family consists of two major clades: Type I and Type II. Type I genes have a conserved N-terminal MADS DNA binding domain (M). Type II genes contain an M-domain, a less conserved Intervening domain (I), a conserved Keratin-like coiled-coil domain (K-box), and a highly variable, often species-specific, C-terminal domain (<xref ref-type="bibr" rid="B88">Thei&#xdf;en et&#xa0;al., 1996</xref>; <xref ref-type="bibr" rid="B1">Alvarez-Buylla et&#xa0;al., 2000</xref>; <xref ref-type="bibr" rid="B78">Smaczniak et&#xa0;al., 2012</xref>). Type II <italic>MADS-box</italic> genes are also known as <italic>MIKC</italic> genes and can be further subdivided into <italic>MIKC</italic>
<sup>c</sup> and <italic>MIKC</italic>* types (<xref ref-type="bibr" rid="B31">Henschel et&#xa0;al., 2002</xref>). <italic>MIKC</italic>
<sup>c</sup> genes comprise several sub-groups including the well-known ABC(D)E genes crucial for floral organ determination and development (<xref ref-type="bibr" rid="B5">Becker and Thei&#xdf;en, 2003</xref>; <xref ref-type="bibr" rid="B89">Thei&#xdf;en et&#xa0;al., 2016</xref>). Research results on Asteraceae floral development particularly come from the classical model <italic>Gerbera</italic> (Mutisioideae; <xref ref-type="bibr" rid="B104">Zhang et&#xa0;al., 2017</xref>) and more recently from crops such as lettuce (Cichorioideae; <xref ref-type="bibr" rid="B61">Ning et&#xa0;al., 2019</xref>), sunflower (Asteroideae; <xref ref-type="bibr" rid="B19">Dezar, 2003</xref>), and chrysanthemum (Asteroideae; <xref ref-type="bibr" rid="B102">Won et&#xa0;al., 2021</xref>). For example, in <italic>Gerbera</italic>, a total of eight <italic>SEPALLATA</italic>-like (<italic>SEP</italic>-like; class E) genes were found (<xref ref-type="bibr" rid="B104">Zhang et&#xa0;al., 2017</xref>), whereas <italic>Arabidopsis</italic> has only four <italic>SEP</italic>-like genes. Unlike the redundancy of <italic>SEP</italic> copies in <italic>Arabidopsis</italic>, the different <italic>SEP</italic>-like genes in <italic>Gerbera</italic> show sub-functionalization in floral organ development and neo-functionalization in the inflorescence meristem in addition to conserved functions (<xref ref-type="bibr" rid="B24">Elomaa et&#xa0;al., 2018</xref>). Genome-wide analysis of <italic>MADS-box</italic> genes in <italic>Chrysanthemum</italic> and lettuce identified a putative <italic>Asteraceae-specific MADS-box</italic> (AS-MADS) clade, genes of which the evolution and function are still unclear (<xref ref-type="bibr" rid="B102">Won et&#xa0;al., 2021</xref>).</p>
<p>All <italic>TCP</italic> genes contain a highly conserved <italic>basic HELIX LOOP HELIX</italic> (<italic>bHLH</italic>) domain by which they are divided into Class I (P) and Class II (C) (<xref ref-type="bibr" rid="B39">Kosugi and Ohashi, 1997</xref>; <xref ref-type="bibr" rid="B59">Navaud et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B46">Li, 2015</xref>). Class I <italic>TCP</italic> genes represent the <italic>PROLIFERATING CELL FACTOR</italic> (<italic>PCF</italic>) genes, while class II <italic>TCP</italic> genes are divided into the ubiquitous <italic>CINCINNATA</italic> (<italic>CIN</italic>) genes and angiosperm-specific <italic>CYCLOIDEA/TEOSINTE BRANCHED1</italic> (<italic>CYC/TB</italic>1) genes (<xref ref-type="bibr" rid="B51">Luo et&#xa0;al., 1996</xref>; <xref ref-type="bibr" rid="B21">Doebley et&#xa0;al., 1997</xref>; <xref ref-type="bibr" rid="B58">Nath et&#xa0;al., 2003</xref>; <xref ref-type="bibr" rid="B55">Mart&#xed;n-Trillo and Cubas, 2010</xref>). Among them, <italic>CYC/TB1</italic> genes are closely associated with the regulation of flower symmetry (e.g., in <italic>Antirrhinum majus</italic>; <xref ref-type="bibr" rid="B51">Luo et&#xa0;al., 1996</xref>). Studies of <italic>Senecio</italic> (Asteraceae) showed that the <italic>CYC</italic>2-like genes <italic>RAY</italic>1 and <italic>RAY</italic>2 are involved in the development of ray florets (<xref ref-type="bibr" rid="B37">Kim et&#xa0;al., 2008</xref>). <italic>CYC</italic>2 homologs control various roles in the formation of ray and disc florets in distinct Asteraceae lineages, suggesting neo-functionalization (<xref ref-type="bibr" rid="B24">Elomaa et&#xa0;al., 2018</xref>), and an extensive study found that the developmental program of making a ray flower involves functionally divergent <italic>CYC</italic>2-like genes in different lineages (<xref ref-type="bibr" rid="B15">Chen et&#xa0;al., 2018</xref>). However, the function of <italic>CYC</italic> in the formation of ligulate florets is yet unconfirmed. An understudied group of <italic>TCP</italic> genes is <italic>PCF</italic> genes (<xref ref-type="bibr" rid="B39">Kosugi and Ohashi, 1997</xref>), which participate in a wide range of plant growth, including flower development. The increasing number of sequenced genomes presents us with an opportunity to conduct a systematic analysis of these important <italic>MADS-box</italic> and <italic>TCP</italic> gene families in a wide range of Asteraceae species.</p>
<p>To study the evolution of <italic>MADS-box</italic> and <italic>TCP</italic> gene families in Asteraceae, a plant family-based phylogenomic analysis is required to gain more knowledge about the history of gene retention after Asteraceae radiation-related WGDs. Moreover, the patterns of gene movement (transpositions) could help identify potential sources of regulatory novelty induced by genomic context change. Thus, a broad range of genomic comparisons, like synteny network analysis (<xref ref-type="bibr" rid="B106">Zhao and Schranz, 2017</xref>), is valuable to conduct alongside phylogenetic analysis. Synteny can help determine the orthologous relationships of duplicated genes among species after complex WGDs and identify other genomic positional changes, like ancient tandem duplications and gene transpositions (<xref ref-type="bibr" rid="B18">Dewey, 2011</xref>; <xref ref-type="bibr" rid="B105">Zhao et&#xa0;al., 2017</xref>).</p>
<p>In this study, we used the common dandelion (<italic>Taraxacum officinale</italic>; <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>), a member of the Cichorioideae and taxonomic outgroup of lettuce, as a model. Dandelion is well-studied because of its two reproduction modes that co-occur within its distribution range: sexual diploids (2<italic>n</italic> = 2<italic>x</italic> = 16) and asexual, apomict, triploids (2<italic>n</italic> = 3<italic>x</italic> = 24) (<xref ref-type="bibr" rid="B92">Van Dijk et&#xa0;al., 1999</xref>), for example, to study the molecular genetic basis of apomixis elements including diplospory (<xref ref-type="bibr" rid="B98">Vijverberg et&#xa0;al., 2004</xref>; <xref ref-type="bibr" rid="B96">Vijverberg et&#xa0;al., 2010</xref>) and parthenogenesis (<xref ref-type="bibr" rid="B97">Vijverberg et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B91">Van Dijk et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B90">Underwood et&#xa0;al., 2022</xref>). Dandelion has been investigated for its ecological evolution and adaption (<xref ref-type="bibr" rid="B6">Brock et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B95">Verhoeven et&#xa0;al., 2018</xref>) and more recently for its aforementioned floret and fruit characteristics (<xref ref-type="bibr" rid="B99">Vijverberg et&#xa0;al., 2021</xref>). A genome assembly of this interesting model species will provide insights into its gene and genome evolution and serve as an important reference for comparative analysis within the Asteraceae, other <italic>Taraxacum</italic> species and genotypes, and related species such as lettuce, and for gene analysis and gene editing purposes.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Overview of this study. <bold>(A)</bold> Summarized phylogeny of the angiosperms analyzed based on amino acid sequences of selected Type II <italic>MADS-box</italic> genes, with a focus on the Asteraceae and the position of <italic>Taraxacum</italic> therein and with the ancestral whole-genome duplications and triplications (stars) and subfamilies (colors) indicated (left) and a sexual dandelion plant (right). <bold>(B)</bold> Phylogenetic tree of the Type II <italic>MADS-box</italic> genes found in the species studied (see panel A), based on the MADS- and K-box domain protein sequences, with the species subfamilies in the outer circle (see panel <bold>A</bold> for colors), the syntenic relationships by colored lines within the circle, and the <italic>MADS-box</italic> gene families indicated. <bold>(C)</bold> Dandelion floral tissues and stages used in the gene expression analysis: F = upper floral part and S = lower floral part, separated through the beak (dotted line) except for the youngest stage (F0S0), with stage 1 = bud just before opening; 2 = open flower; 3 = 3 days after pollination (DAP); 7 = 7 DAP. <sup>&#xa9;</sup> Kitty Vijverberg and Wei Xiong.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1198909-g001.tif"/>
</fig>
<p>Here, we analyzed our <italic>de novo</italic> assembly of a diploid sexual <italic>T. officinale</italic> genome together with the published whole-genome sequences of 32 other plant species. We performed genome-wide searches for <italic>MADS-box</italic> and <italic>TCP</italic> genes of the 33 species (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>) and constructed a synteny network of the identified genes to reveal their lineage-specific genome context and ancient tandem duplications, with a focus on the Asteraceae, its subclades Asteroideae and Cichorioideae, and <italic>Taraxacum</italic>. We examined the synteny versus phylogenetic trees based on <italic>MADS-box</italic> (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>) and <italic>TCP</italic> domain sequences and assessed a possible change in function after gene duplication or genomic context change <italic>via</italic> comparison to gene expression data in different floral developmental stages and tissues (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1C</bold>
</xref>) in dandelion. We also applied phylogenomic data to characterize the evolution of <italic>Asteraceae-specific MADS</italic> (<italic>AS-MADS</italic>) genes and their expression during floral development. Our results provide insights into the evolution of Asteraceae and their <italic>MADS-box</italic> and <italic>TCP</italic> genes, while the wealth of genome and transcriptome data serves as a reference for future comparative analyses and research on floral development in dandelion and beyond.</p>
</sec>
<sec id="s2" sec-type="results">
<label>2</label>
<title>Results</title>
<sec id="s2_1">
<label>2.1</label>
<title>Genome sequencing and assembly</title>
<p>The <italic>T. officinale</italic> genome of the sexual diploid plant FCh72 was sequenced with PacBio RSII and 10X Genomics on Illumina HiSeq2500 and optically mapped with BioNano. We obtained ~75&#xd7; coverage of PacBio reads with a mean subread length of 12,259 bp. The reads were assembled using Canu v1.3 (<xref ref-type="bibr" rid="B38">Koren et&#xa0;al., 2017</xref>). The assembly was scaffolded with the 10X and BioNano data and polished with the 10X Illumina reads. Haplo-contigs were collapsed where possible, and the assembly was polished and scaffolded multiple times in subsequent rounds (see Materials and Methods). The resulting assembly has a total genome size of 936 Mb (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>), which is slightly larger than the expected 831 Mb based on C-values (<uri xlink:href="https://cvalues.science.kew.org/">cvalues.science.kew.org/</uri>) and significantly larger than the estimated genome size based on k-mer analysis (~614 Mb; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S1</bold>
</xref>). Blobtools confirmed the absence of contamination (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S2</bold>
</xref>). This draft genome assembly has 4,059 scaffolds, an N50 size of 757 kb, and the longest scaffold of ~23 Mb (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>). The guanine-cytosine (GC) content is 37.0%. The mitochondrial (mt) genome was assembled in a single scaffold that showed high homology to the mt-DNA of the related species lettuce (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S3A</bold>
</xref>), whereas the chloroplast (cp) genome has not been recovered, likely due to bleaching prior to the harvesting of plant material (Material and Methods; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S3B</bold>
</xref>). Difficulties in assembling were posed by the heterozygosity of the genome, which was estimated at 1.5% with GenomeScope, showing two clear k-mer peaks (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S1</bold>
</xref>; k = 21). The Benchmarking Universal Single-Copy Orthologs (BUSCO) quality assessment of the genome assembly showed 95.4% completeness (2,219/2,326; <xref ref-type="table" rid="T1"><bold>Table 1</bold></xref>), with 1,759 (75.6%) complete and single copy and 460 (19.8%) complete and duplicated genes. The high duplicated BUSCO percentage is likely due to remaining alleles, in line with partial assembly in haplo-contigs.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Main characteristics of <italic>Taraxacum officinale</italic> genome.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Genome assembly and annotation</th>
<th valign="middle" align="center">Statistics</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Assembly size (Mb)</td>
<td valign="middle" align="left">936</td>
</tr>
<tr>
<td valign="middle" align="left">Expected genome size (Mb)</td>
<td valign="middle" align="left">831</td>
</tr>
<tr>
<td valign="middle" align="left">Number of scaffolds</td>
<td valign="middle" align="left">4,059</td>
</tr>
<tr>
<td valign="middle" align="left">N50 super-scaffolds (Kb)</td>
<td valign="middle" align="left">757</td>
</tr>
<tr>
<td valign="middle" align="left">Heterozygosity (%)</td>
<td valign="middle" align="left">1.5</td>
</tr>
<tr>
<td valign="middle" align="left">BUSCO completeness of assembly (%)</td>
<td valign="middle" align="left">95.4</td>
</tr>
<tr>
<td valign="middle" align="left">Repeats (%)</td>
<td valign="middle" align="left">63</td>
</tr>
<tr>
<td valign="middle" align="left">Predicted high confident genes</td>
<td valign="middle" align="left">60,810</td>
</tr>
<tr>
<td valign="middle" align="left">Functional annotated transcripts</td>
<td valign="middle" align="left">56,560</td>
</tr>
<tr>
<td valign="middle" align="left">Sequence identical genes (%)</td>
<td valign="middle" align="left">2.7</td>
</tr>
<tr>
<td valign="middle" align="left">Protein &gt;99% similar genes (%)</td>
<td valign="middle" align="left">7.5</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Genome annotation</title>
<p>The assembled genome was repeat masked using RepeatModeler with long terminal repeat (LTR) detection and using RepeatMasker. In total, 63% of all bases were masked, which is similar to the repeat content of <italic>Taraxacum mongolicum</italic> and <italic>Taraxacum kok-saghyz</italic> (<xref ref-type="bibr" rid="B48">Lin et&#xa0;al., 2022</xref>). The repeat content was to a large extent driven by LTRs, namely, <italic>Copia</italic> (~214 Mb, 22.9% of the genome) and <italic>Gypsy</italic> (~135 Mb, 14.5%) retrotransposons (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>).</p>
<p>The genome was annotated using an RNAseq library based on four different tissue types of the sequenced dandelion genotype&#x2014;leaf, bud, open flower, and roots&#x2014;using BRAKER2 (see Materials and Methods). A total of 60,810 high-confident genes (i.e., size &#x2267;150 amino acids [aa] or &#x2267;50 aa with homology annotation) with 63,780 transcripts were found (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S1</bold>
</xref>). The mean gene length was 2,110 bp with on average 4.7 exons and a mean total Coding Sequence (CDS) length of 971 bp (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>). For 88.7% of the genes (56,560), the transcripts have a description, and 61.4% (37,324) are associated with at least one Gene Ontology (GO) term (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>).</p>
<p>A total of 1,739 high-quality genes (2.7%) were found to have at least one identical sequence copy in the annotation, and 4,788 genes (7.5%) showed more than 99% amino acid identity with another annotated gene (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>; indicated in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S1</bold>
</xref>) and are either true duplicates, closely related family members, or alleles at different haplo-contigs. The most abundant genes showed 15 and 11 copies, representing <italic>Histone H</italic>4 and <italic>GOS</italic>9-like isoforms, respectively (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S1</bold>
</xref>). BUSCO analysis of the translated transcripts showed 90% completeness with 19.4% duplicated BUSCOs.</p>
<p>An unfiltered gene set that includes the high confidence gene models, as well as smaller transcripts (50&#x2013;150 aa) and genes without homology annotation of 81,292 genes in total with 85,093 transcripts, was used in the gene expression analyses and synteny mapping results (see below).</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Genome comparison between <italic>Taraxacum</italic> spp. assemblies</title>
<p>The <italic>T. officinale</italic> genome assembly was compared to that of the recently published whole-genome sequences of two other sexual diploid <italic>Taraxacum</italic> species, <italic>Taraxacum mongolica</italic> (<italic>Tmo</italic>) and <italic>T. kok-saghyz</italic> (<italic>Tks</italic>) (<xref ref-type="bibr" rid="B48">Lin et&#xa0;al., 2022</xref>), showing a relatively fragmented assembly (4,059 scaffolds versus 65 in <italic>Tmo</italic> and 160 in <italic>Tks</italic>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S4</bold>
</xref>). The annotation of gene space was, however, far more complete in <italic>T. officinale</italic> based on the BUSCO results (90% completeness versus 69% in <italic>Tmo</italic> and 74% in <italic>Tks</italic>). The GC content of 37% was similar to the other two species, whereas the heterozygosity varied from 1% (<italic>Tks</italic>) to 1.5% (<italic>Tof</italic>). The assemblies are collinear without major structural rearrangements if compared by alignments and dot plots (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S4</bold>
</xref>).</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Synteny network analysis: identification of <italic>Asteraceae-specific MADS-box</italic> and <italic>TCP</italic> gene synteny clusters</title>
<p>To compare the genomic context of genes in Asteraceae and with selected outgroups, we conducted a synteny network analysis of 33 angiosperm species with high-quality whole-genome sequences (12 Asteraceae, 18 other Asterids, 2 Rosids, and 1 early-diverging Angiosperm; <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S5</bold>
</xref>). Within the Asteraceae, six species were from the Cichorioideae, including our <italic>de novo</italic> sequenced <italic>T. officinale</italic> (<italic>Tof</italic>), two additional <italic>Taraxacum</italic> species (<italic>Tmo</italic> and <italic>Tks</italic>) (<xref ref-type="bibr" rid="B48">Lin et&#xa0;al., 2022</xref>), and three <italic>Lactuca</italic> species. In addition, four species of the Asteroideae and two of the Carduoideae were analyzed. The synteny network database was built using the SynNet pipeline (<xref ref-type="bibr" rid="B106">Zhao and Schranz, 2017</xref>; <xref ref-type="bibr" rid="B28">Gamboa-Tuz et&#xa0;al., 2022</xref>) and contained 718,070 nodes (genes found in syntenic blocks) and 7,603,091 edges (connections between syntenic genes), data on which subsequent analyses were based. We further focused on the sub-networks of the <italic>MADS-box</italic> and <italic>TCP</italic> gene families.</p>
<p>With the use of HMMER analysis of proteome sequences of the 33 species, the <italic>MADS-box</italic> genes were identified by searching for the <italic>MADS-box</italic> (SRF-TF: PF00319.20) and <italic>K-box</italic> (PF01486.20) domains and the <italic>TCP</italic> genes by searching for the <italic>TCP</italic>-specific <italic>bHLH</italic> domain (PF03634.15). We further classified the identified candidates by their sequence similarity and phylogenetic relationship to well-known reference genes, particularly from <italic>Arabidopsis</italic>, <italic>Petunia</italic>, and <italic>Gerbera</italic> (<italic>MADS-box</italic> genes), and <italic>Arabidopsis</italic> and rice (<italic>TCP</italic> genes) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S6</bold>
</xref>). In total, 2,525 <italic>MADS-box</italic> and 1,019 <italic>TCP</italic> genes were identified (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S2</bold>
</xref>). After classification, the normalized gene count (i.e., Z-score) for each clade was calculated. Results identified several gene expansions in different plant families (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S7</bold>
</xref>), particularly, Type I and <italic>MIKC</italic>* in the Solanaceae and <italic>MIKC</italic>
<sup>c</sup> and <italic>CYC</italic> in the Asteraceae. Within <italic>Taraxacum</italic>, we found more <italic>MADS-box</italic> genes in <italic>T. officinale</italic> (78) than in <italic>T. mongolicum</italic> (54) and <italic>T. kok-saghyz</italic> (57) and a similar number of <italic>TCP</italic> genes (31-34), with the former possibly as a result of their genome completeness.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>    <p>Heatmap of <italic>MADS-box</italic> and <italic>TCP</italic> gene counts normalized per gene clade. Target genes were identified and classified into sub-clades (row) for each species (column), and the count was scaled (cell) by using z-scores. Colors illustrate the deviation from average, with blue for smaller numbers and red for larger numbers. <italic>Erigeron breviscapus</italic> was excluded from this visualization due to its incompleteness of target genes. Species subfamilies are indicated in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1198909-g002.tif"/>
</fig>
<p>The complete lists of <italic>MADS-box</italic> and <italic>TCP</italic> genes were used to extract their synteny sub-networks from the whole network database. The resulting <italic>MADS-box</italic> sub-network contained 1,677 nodes and 16,697 syntenic edges, and the <italic>TCP</italic> sub-network contained 835 nodes and 14,716 syntenic edges (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S3A, B</bold>
</xref>). To associate the syntelogs (the syntenic homologous genes) with each other, we conducted phylogenetic profiling of all obtained synteny clusters of <italic>MADS-box</italic> and <italic>TCP</italic> proteins and visualized the primary clusters in a heatmap for each family (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S3C, D</bold>
</xref>). For this, the number of syntelogs in each cluster was counted for each species, and the clusters were ordered by hierarchical clustering based on the index of dissimilarity derived from the syntelog counts. Then, the clusters that were specific to the Asteraceae, Cichorioideae, and/or <italic>Taraxacum</italic> were determined. In <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>, we highlight 15 synteny clusters that illustrate our most relevant findings: the Asteraceae or <italic>Taraxacum</italic>-specific <italic>MADS-box</italic> clusters <italic>AG</italic>-like (CL4&#x2013;5) and <italic>SEP3</italic>/<italic>FLC</italic>/<italic>AS-MADS</italic> (<italic>SFA</italic>; CL7), and <italic>TCP</italic>-<italic>PCF</italic> cluster 15 (CL15), and absence of <italic>AG-</italic>like cluster 2 (CL2) and <italic>TCP</italic>-<italic>PCF</italic> cluster 14 (CL14). The selected clusters are also displayed in a network format, pruning the non-primary syntelogs (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>).</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>    <p>Synteny network clusters revealed the Asteraceae-specific context of several <italic>MADS-box</italic> and <italic>TCP</italic> genes important in floral development. <bold>(A)</bold> Phylogenetic profiling map showing a selection of <italic>MADS-box</italic> (<italic>AG</italic>-like and <italic>SEP</italic>, <italic>FLC</italic>, <italic>AS-MADS</italic> [SFA] clades) and <italic>TCP</italic> (<italic>PCF</italic> clade) gene clusters including the ones that showed a lineage-specific context: Cluster 4 (CL4) and CL7 for the Asteraceae, CL15 for the Cichorioideae, and CL5 for <italic>Taraxacum</italic>. Gradient green cells represent the number of syntelogs (syntenic homologs) for each cluster in the different species; the phylogenetic tree (left) and subspecies (right) are as in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>. <bold>(B)</bold> The same clusters are visualized in a network, particularly showing the syntenic relationships between <italic>SEP</italic>, <italic>FLC</italic>, and <italic>AS-MADS</italic>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1198909-g003.tif"/>
</fig>
<p>The <italic>AG</italic>-like genes include the C class gene <italic>AGAMOUS</italic> (<italic>AG</italic>; CL1, <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>) and C/D class genes <italic>SHATTERPROOF</italic>-like (<italic>SHP</italic>-like; CL2) and <italic>SEEDSTICK</italic>-like (<italic>STK</italic>-like; CL3&#x2013;5). <italic>AG</italic> is critical for anther and carpel development; <italic>SHP</italic> regulates aspects of fruit development in core eudicots, such as fruit dehiscence in dry fruits (e.g., <italic>Arabidopsis</italic>) and fruit expansion and ripening in fleshy fruits (e.g., tomato); <italic>STK</italic> is involved in ovule development. For <italic>AG</italic>, most orthologous genes resided in the conserved synteny cluster 1 (CL1; <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>), including two genes in <italic>T. officinale</italic>. Syntelog(s) of <italic>SHP</italic> (CL2) were absent in the Asteraceae. Since Asteraceae fruits are single-seeded indehiscent dry fruits (cypsela), this is consistent with a loss or absence of a gain of <italic>SHP</italic> homologs. More than 60% of the <italic>STK</italic> orthologs were in one single synteny cluster (CL3), mainly from non-Asteraceae species. <italic>STK</italic> orthologs from Asteraceae exclusively formed a second synteny cluster (CL4). Moreover, there was an extra pair of syntenic <italic>STK</italic> genes unique in <italic>Taraxacum</italic> species (CL5) and one more present in <italic>T. officinale</italic> only (To_STK_UN; since unique, this is not detected as a cluster). Possibly, these Asteraceae- and <italic>Taraxacum</italic>-specific clusters are associated with a diverged ovule developmental program in these taxa, but this needs additional support and validation.</p>
<p>The <italic>SEP</italic>3-like genes, E class genes of floral development, exemplify another Asteraceae-specific relationship. <italic>SEP</italic> genes underlie the development of all floral organs in many species. A conserved cluster of <italic>SEP</italic>3-like genes was shared by all genomes analyzed, including most Asterids, two Rosids, and the first-diverging angiosperm <italic>Amborella trichopoda</italic> (CL6; <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>). In addition, the majority of another <italic>SEP</italic>3-like cluster (CL7) was predominantly Asteraceae-specific (plus <italic>Coriandrum sativum</italic> [Apiaceae]) and likely a transposed duplicated copy preserved in the Asteraceae.</p>
<p>A third example of Asteraceae-specific synteny was found in <italic>TCP</italic> class II <italic>PCF</italic> genes, which are plant-specific transcription factors that play a role in cell differentiation and plant growth. For <italic>PCF</italic> genes, we identified a Cichorioideae-specific cluster (CL15; <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>), while a second cluster was specific for non-Asteraceae (CL14), hinting at a transposition in the ancestor of the Cichorioideae. The other six <italic>PCF</italic> clusters were relatively conserved in all species analyzed (CL8&#x2013;13). Similarly, the <italic>TCP</italic> subclasses, <italic>CIN</italic> and <italic>CYC</italic> (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S3D</bold>
</xref>), were conserved between the Asteraceae and non-Asteraceae.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Expression analysis of floral tissues and stages</title>
<p>To further analyze the lineage-specific synteny found in the Asteraceae as well as to obtain a global overview of the genetic basis underlying floral development in dandelion, we generated transcriptomes of a total of 25 samples of the sequenced plant FCh72. These included triplicates of very young whole buds (F0S0; initiating organs), older buds just before opening (F1 and S1), and open flowers (F2 and S2), the latter two stages with the florets separated into an upper (F; organs in all four floral whorls) and lower (S; the inner floral whorl/ovary/seed) part by cutting through the beak (<xref ref-type="fig" rid="f1"><bold>Figure 1C</bold></xref>; see for exact stages and the method of <xref ref-type="bibr" rid="B99">Vijverberg et&#xa0;al., 2021</xref>), and duplicates of these floral parts at 3 days after pollination (3 DAP; F3 and S3) and 7 DAP (F7, pappus only; S7, ripening seeds) and leaves (LF). RNA sequencing generated on average 33,8 million read pairs per sample, of which &gt;99.9% was maintained after trimming and on average 98.1% mapped to the annotated <italic>T. officinale</italic> genome (see <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S8</bold>
</xref> for read and mapping statistics and <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S4</bold>
</xref> for expression values).</p>
<p>The quality of the data was checked with a principal coordinate analysis (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S5</bold>
</xref>). This showed clear clustering of the replicates per stage and tissues, with particularly tight clustering of replicates in the youngest stage (F0S0) and younger seed stages (S1 and S2). In the upper floral parts (F), some more variation was detected within and between replicates, reflecting fast changes in gene expression in these rapidly developing tissues and close successive stages. The leaf duplicates also nicely clustered together and diverged from the floral tissues.</p>    <p>Expression patterns were visualized in a heatmap (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S6</bold>
</xref>), which confirmed the reproducibility of the replicates and the quality of the data. Results showed clustering of similar tissues in subsequent stages, particularly of (F0S0), S1, S2 and F1, F2, and associated &#x201c;expression blocks&#x201d; (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S6</bold>
</xref>, blocks 1&#x2013;12; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S4</bold>
</xref>, columns S and T). Blocks with the highest numbers of genes were found among the youngest stages, particularly blocks 2 (F0S0, S1, and S2) and 3 (F1) and to a lesser extent 1 (F0S0) and 4 (F1 and F2) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S9A</bold>
</xref> and graph therein), indicating high transcriptional activity in young floral developmental stages. A relatively high number of genes was also found in block 10 (F3 and F7), indicating diverse gene activity in the degenerating florets. The overall expression pattern based on summed values over all 25 samples, and their classification in seven groups from &#x201c;true zero&#x201d; to &#x201c;extremely high&#x201d; expression (&gt;10,000 TPM) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S4B</bold>
</xref>, columns AT, BT, BU-BX, and summary thereof in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S9B</bold>
</xref>) showed a total of 49,102 genes expressed (60.4%; sum &gt; 1 TPM), with a minority of genes with very high (7.4%; sum &gt; 1,000 TPM) to extremely high (0.5%; sum &gt; 10,000 TPM) expression. The comparison of Total Exon Reads (TERs) versus Unique Gene Reads (UGRs) showed similar expression for most genes (82.9%), but a small part (1.5%) showed significantly higher TERs, and a larger part (15.6%) showed significantly higher UGRs. The most highly expressed genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S9C</bold>
</xref>) included four genes that each showed a summed expression of &gt;100,000 TPM, of which three were related to anthers: <italic>Pollen allergen Art v</italic>1-like (2x) and <italic>Anther-specific SF18</italic>-like, and one hypothetical protein. Other highly expressed genes included <italic>Elongation Factor</italic> 1&#x3b1; (<italic>EF</italic>1&#x3b1;), <italic>Histone</italic> 3 (<italic>H</italic>3), <italic>Acyl-CoA-binding protein</italic>, and <italic>Polyubiquitin</italic> (additional information in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S9</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S4B, C</bold>
</xref>).</p>
<p>Insights into the expression of genes related to floral development, including the <italic>MADS-box</italic> Type I and II genes and <italic>TCP</italic> genes (and <italic>APETALA-</italic>2 [<italic>AP2</italic>]), were based on the averaged expression value of genes per tissue type and stage (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S4C</bold>
</xref>, with in columns F, G, and H the relevant genes indicated; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S10</bold>
</xref> for extraction of these genes). Several genes (13 of the 78 <italic>MADS-box</italic> genes and 5 of the 33 <italic>TCP</italic> genes; 15%&#x2013;17%) were represented by two alleles due to their assembly in haplo-contigs and taken together and their sum of expression used in the final analysis (indicated with a double gene name and asterisk in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S10</bold>
</xref>). Gene expression is visualized in a heatmap per gene subclass (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures S7A&#x2013;D</bold>
</xref>).</p>
<p>The heatmap of the <italic>MADS-box</italic> Type II genes showed clustering of the young upper floral tissues (F0S0, F1, and F2), seed tissues (S1&#x2013;7), and older upper floral tissues (F3 and F7) and a clear differential expression in leaves (LF) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S7A</bold>
</xref>). Virtually all ABC(D)E genes (indicated with an A&#x2013;E prefix in the gene name) were expressed in (subsets of) the floral tissues, confirming the expected expression patterns as well as the homology of the genes identified in the <italic>Taraxacum</italic> genome. For example, the class B gene <italic>PISTILLATA</italic> (<italic>PI</italic>) was highly expressed in young upper floral tissues only, and the class D gene <italic>AGL</italic>11-like was particularly expressed in the ovary and seed tissues. Most other <italic>MADS-box</italic> Type II genes (indicated with an M-prefix in the gene name) showed (very) low expression in the floral tissues, further confirming the important role of <italic>MADS-box</italic> Type II ABC(D)E genes in floral development.</p>
<p>Based on the expression of <italic>MADS-box</italic> Type I genes, the seed tissues clustered together as did the upper floral tissues (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S7B</bold>
</xref>), supporting their important role in ovule and seed development. A few genes were specifically expressed in young buds, <italic>AGL</italic>47 and <italic>AGL</italic>62, which also confirms expectations. The heatmap of <italic>TCP</italic> Class I and Class II gene expression showed a similar clustering of tissues as the <italic>MADS-box</italic> Type II genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S7C</bold>
</xref> versus <xref ref-type="supplementary-material" rid="SM1">
<bold>S7A</bold>
</xref>), also supporting their role in floral development. In particular, the <italic>CIN</italic> genes were highly expressed in the floral tissues in addition to some <italic>PCF</italic> genes, while most <italic>CYC</italic> genes showed (very) low expression. Examples of tissue specificities are the high expression of a <italic>TCP</italic>5-like gene in young buds and a <italic>TCP</italic>8-like gene in tissues after pollination (F3, S3, F7, and S7). Finally, the expression of the <italic>AP2</italic>-like homologs, an A class non-<italic>MADS-box</italic> transcription factor gene, is shown (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S7D</bold>
</xref>), of which some showed expression in the young buds according to their role in early floral organ ontogenesis.</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Phylogenomic analysis of <italic>MADS-box</italic> and <italic>TCP</italic> genes, Synthesis</title>
<p>To depict the evolutionary relationships between the different <italic>MADS-box</italic> and <italic>TCP</italic> genes, we mapped the syntenic connections (genomic context) onto the gene trees (gene sequence divergence; <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S8</bold>
</xref>). Next, we extracted the subsets of genes associated with lineage specificity within the Asteraceae for more detailed analysis and comparison of their expression in dandelion (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>). The gene trees were based on the amino acid alignments of the <italic>MADS</italic> domain (<italic>MADS-box</italic> genes) and <italic>bHLH</italic> domain (<italic>TCP</italic> genes), respectively, confirming the splitting of <italic>MADS-box</italic> genes into Type I and Type II (including <italic>MIKC</italic>* and <italic>MIKC</italic>
<sup>c</sup>) and <italic>TCP</italic> genes into <italic>PCF</italic>, <italic>CIN</italic>, and <italic>CYC/TB1</italic> genes. To improve the resolution of the <italic>MADS-box MIKC</italic>
<sup>c</sup> genes, an independent phylogenetic tree was built using 1,154 Type II <italic>MIKC</italic>
<sup>c</sup> genes where the K-box domain(s) was included in the alignment with the <italic>MADS-box</italic> domain (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S2a, column C</bold>
</xref>; <xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1B</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4A, B</bold>
</xref>). Both the phylogenies of the <italic>MADS-box MIKC</italic>
<sup>c</sup> genes (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;1B, 4A, B</bold>
</xref>) and the <italic>TCP</italic>-<italic>PCF</italic> genes (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4C</bold>
</xref>) clearly classified the various gene clades. The syntenic relationships (colored connection lines within the circles) visualize (in)congruencies with the gene evolution (phylogenetic tree), with the Asteraceae sub-families highlighted (colored sections of the circle). Both the <italic>MIKC</italic>
<sup>c</sup> and <italic>PCF</italic> results showed a high level of similarity between the syntenic and gene sequence relationships, with some interesting exceptions that are described in the next paragraphs.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>    <p>Phylogenetic trees of the <italic>MADS-box</italic> and <italic>TCP</italic> gene clades that include genes with lineage-specific genomic context (see <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>)&#x2014;<italic>AG</italic>-like, <italic>SEP</italic>3, and <italic>PCF</italic> genes&#x2014;based on <italic>MADS-box</italic> and <italic>K-box</italic> <bold>(A, B)</bold> and bHLH <bold>(C)</bold> domain amino acid alignments, respectively (left) and gene expression in different floral stages and tissues (right). Species subclades are indicated in the circle (colors as in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>) and synteny clusters with colored lines within the circle. <bold>(A)</bold> The <italic>AG</italic>-like clade. This shows three clades based on the gene tree and five based on their synteny: CL1 (light green) shared by all species and putatively ancestral, CL2 (the <italic>SHP</italic> clade, yellow), which is present only in non-Asteraceae, and CL3&#x2013;5 (the <italic>STK</italic> clade, dark green and red lines), indicating gene duplications and divergence. Different expression patterns of the <italic>AG</italic>-like genes in <italic>Taraxacum</italic> floral tissues support their divergence. <bold>(B)</bold> <italic>SEP</italic>3 clade. This shows two clades based on both the gene sequence and syntenic relationships, indicating high conservation. CL7 is unique to the Asteraceae, possibly as a result of a transposition after gene duplication in the ancestor of the Asteraceae. Overall similar expression of the <italic>SEP</italic>3-like genes in <italic>Taraxacum</italic> supports their conservation. <bold>(C)</bold> <italic>PCF</italic> clade. This shows three subclades in the gene tree, while CL8 (yellow lines) and CL11 (pink lines) both contain syntenically connected genes from all three subclades, indicating paralogous relationships. Asteraceae-specific CL15 genes (fluorescent green lines) are monophyletic and might be a result of duplication within the second <italic>PCF</italic> clade (CL12 and CL13). Divergence in their expression pattern supports that these genes are diverging.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1198909-g004.tif"/>
</fig>
<p>In <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>, a difference between the syntenic and genetic relationships was particularly seen for <italic>B-sister</italic> (<italic>BS</italic>) versus <italic>PISTILLATA (PI</italic>) genes (gray lines), <italic>AGAMOUS</italic>-like 6 (<italic>AGL</italic>6) versus <italic>SUPPRESSOR OF OVEREXPRESSION OF CONSTANS</italic> 1 (<italic>SOC</italic>1)/<italic>TOMATO MADS-box</italic> gene 3 (<italic>TM</italic>3) genes (dark green lines), and <italic>SEP</italic>-like versus <italic>APETALA</italic> 1 (<italic>AP</italic>1)/FRUITFUL (<italic>FUL</italic>) genes (yellow lines). These genes show a clear close relationship based on their genomic context (are syntenic) but occur in different clades in the phylogenetic tree based on their sequences. It suggests that these genes have diverged, possibly as a result of selection or by a duplication followed by a loss of one of the two copies. <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref> also visualizes the <italic>MADS-box</italic> lineages that are Asteraceae specific, one within the <italic>AG</italic>-like clade (<italic>STK</italic>-like genes, red lines) and one within the <italic>SFA</italic> clade (<italic>SEP</italic>3-like genes, dark pink lines). These two syntenic clusters are shown separately in <xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4A, B</bold>
</xref> and described below.</p>
<p>The <italic>AG</italic>-like (<italic>AG</italic>, <italic>SHP</italic>, and <italic>STK</italic>) gene tree, supported by syntenic connections (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>, phylogeny), showed the three gene clades with five synteny clusters: the <italic>AG</italic> clade (CL1), shared by all species and putatively ancestral, the <italic>SHP</italic> clade (CL2), present in non-Asteraceae species only, and the <italic>STK</italic> clade (CL3&#x2013;5), showing evidence for gene duplications and divergence. The separation of the three <italic>AG</italic>-like gene clusters is in line with the previous C/D class gene classification in angiosperms (<xref ref-type="bibr" rid="B40">Kramer et&#xa0;al., 2004</xref>). The tree validates the overall high conservation of <italic>AG</italic> genes and the absence of <italic>SHP</italic>-like genes in the Asteraceae, as mentioned above in relation to the synteny analysis (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>). In addition, the <italic>AG</italic>-like gene tree shows that the genes in the <italic>STK</italic>-like clusters (CL3, dark green lines; CL4 and CL5, red lines) underwent different modes of evolution: the genes in CL3 are syntenically related but distributed over different clades based on their sequences, while within the Asteraceae, the genes in CL3 are genetically related to those in CL4 but syntenically diverged. The extra <italic>STK</italic>-like copy in <italic>Taraxacum</italic> (CL5), and another copy found in <italic>T. officinale</italic> only (To_STK_UN), suggest a unique evolution of <italic>STK</italic>-like genes in dandelions. Different expression patterns in the <italic>AG</italic>-like genes in <italic>Taraxacum</italic> (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>, floret cartoon), with overall high expression of CL1 genes (<italic>AG</italic>, C class, dark red), and various, less high expression of CL4, CL5, and To_STK_UN (i.e., similar to CL5, but with less high [yellow] expression in S1&#x2013;S7; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S10</bold>
</xref>) genes, support their divergence.</p>
<p>For the <italic>SEP</italic>3 orthologous group (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>, phylogeny), most gene copies resided in CL6 (light pink lines), and these form one clade in the gene tree, supporting the high conservation of this expanded gene group in genomic as well as sequence context. A second group of syntelogs was found in the Asteraceae (CL7; red lines) and is also supported by the gene tree. Possibly, these genes result from a transposition after duplication in the ancestor of the Asteraceae. The expression of the <italic>SEP</italic>3-like genes in <italic>Taraxacum</italic> (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>, floret cartoon) shows some reduction in mature floral tissues in the conserved, putatively ancestral, CL6 gene, and overall high expression in the Asteraceae-associated CL7 gene. This supports the importance of E class genes in a wide range of floral developmental aspects and indicates that the two gene copies have not (yet) much diverged and may have remained a similar function.</p>
<p>
<italic>PCF</italic> genes form a large clade within the <italic>TCP</italic> genes and were divided into three subclades based on their gene tree (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4C</bold>
</xref>, phylogeny). Cluster 8 (yellow lines) and CL11 (pink lines) both contain syntenically connected genes from all three subclades, indicating their paralogous relationships. Asteraceae-specific CL15 genes (fluorescent green lines) are monophyletic according to the gene tree and likely a result of duplication within the second <italic>PCF</italic> clade (CL12 and CL13). Divergence in their expression pattern (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4C</bold>
</xref>, floret cartoon) suggests that these genes are diverging.</p>
<p>To summarize, the extracted gene trees of <italic>AG</italic>-like (CL1&#x2013;5), <italic>SEP</italic>3 (CL6&#x2013;7), and <italic>PCF</italic> genes (CL8&#x2013;15) confirmed the orthologous relationship of genes within Asteraceae-specific synteny clusters (CL4, 5, 7, and 15) as well as of genes widely conserved within the angiosperms (CL1, 6, and 8&#x2013;13) or being non-Asteraceae specific (e.g., CL2 and 14). By combining the gene phylogeny and synteny, we validated the occurrence of duplications and/or transpositions of <italic>AG</italic>-like, <italic>SEP</italic>3, and <italic>PCF</italic> genes in ancestral species of the Asteraceae or subsets thereof and added an extra level of evolutionary history to the traditional gene tree phylogenies. The comparison of the expression of these genes in different floral tissues in dandelion added another level of information by either supporting or not their divergence. Confirmation of the results by expression data in other Asteraceae in the literature, e.g., <xref ref-type="bibr" rid="B61">Ning et&#xa0;al., 2019</xref> (lettuce) and <xref ref-type="bibr" rid="B102">Won et&#xa0;al., 2021</xref> (<italic>Chrysanthemum</italic>), was inconclusive mainly as a result of different tissues and stages.</p>
</sec>
<sec id="s2_7">
<label>2.7</label>
<title>Presence of <italic>AS-MADS</italic> orthologs outside the Asteraceae and interference with their evolution, function, and relationship to <italic>SEP</italic>3 and <italic>FLC</italic>
</title>
<p>In a recent paper on <italic>MADS-box</italic> genes in <italic>Chrysanthemum</italic>, a unique, monophyletic clade was found, including 11 <italic>Chrysanthemum</italic> genes (<italic>CnMADS</italic>54&#x2013;64) and one from lettuce (<italic>LsMADS</italic>16). These were named <italic>Asteraceae-specific MADS-box</italic> (<italic>AS-MADS</italic>) genes (<xref ref-type="bibr" rid="B102">Won et&#xa0;al., 2021</xref>). To characterize this potentially novel Asteraceae sub-group, we included <italic>LsMADS</italic>16 as a reference in our <italic>MADS-box</italic> search and annotation. Most <italic>AS-MADS</italic> genes were found to belong to the syntenic cluster 6 (CL6, <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>), which is one of the largest clusters in our analysis with 99 nodes. CL6 includes <italic>SEP</italic>3 and <italic>FLC</italic> in addition to <italic>AS-MADS</italic> genes (<italic>SFA</italic>), and its network showed nodes of <italic>SEP</italic>3-like genes that are widely but loosely connected to the sub-clusters of <italic>FLC</italic>-like and <italic>AS-MADS</italic>-like genes, both inter- and intra-specifically (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>, <italic>SFA</italic> network). We analyzed the relationships and expression of the <italic>SFA</italic> genes in more detail (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). The syntenic relationships between distant clades of the same gene family can indicate ancient tandem duplication (TD) events. For example, an ancient tandem duplication of an ancestral <italic>MADS-box</italic> gene in addition to several rounds of WGD is supposed to have resulted in the present tandem pairs <italic>SEP1</italic>-like&#x2013;<italic>AP1</italic>, <italic>TM3</italic>&#x2013;<italic>AGL6</italic>, and <italic>SEP</italic>3&#x2013;<italic>FLC</italic> (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>). For the <italic>SFA</italic> cluster in our study, the synteny between <italic>SEP</italic>3 and <italic>FLC</italic> confirmed the previously identified TD (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>), which was further supported by the presence of a <italic>SEP</italic>3&#x2013;<italic>FLC</italic> tandem of <italic>Solanum tuberosum</italic>, <italic>Coffea canephora</italic>, and <italic>Beta vulgaris</italic>, found in a genome-wide search for tandem duplicates of <italic>MADS-box</italic> genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S11</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S5</bold>
</xref>). Moreover, syntenic relationships (i.e., colored lines connect genes in the phylogenic tree) were found between <italic>SEP</italic>3 and <italic>AS-MADS</italic> genes (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3B</bold>
</xref> [SFA plot] and <xref ref-type="fig" rid="f5"><bold>5A</bold></xref>), and an example of a <italic>SEP</italic>3&#x2013;<italic>AS-MADS</italic> tandem was found in <italic>Chenopodium quinoa</italic> (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S11</bold>
</xref>). Phylogenetically, the gene tree showed that <italic>AS-MADS</italic> is a sister clade of <italic>FLC</italic> (indicated in orange and beige, respectively, in the inner circle of <xref ref-type="fig" rid="f5">
<bold>Figures&#xa0;5A, B</bold>
</xref>), with a similar genomic context (pink connection lines within the phylogenetic tree in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>), indicating an extra round of duplication before the divergence of these genes after the ancient TD. In addition to WGDs, a tandem homolog of <italic>AS-MADS</italic>-<italic>FLC</italic> was found in the potato genome (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S11</bold>
</xref>); therefore, a TD could also have been responsible for the paralogous clades of <italic>AS-MADS</italic> and <italic>FLC</italic>.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>    <p>Inferred evolution of <italic>Asteraceae-specific MADS-box</italic> (<italic>AS-MADS</italic>) gene. <bold>(A)</bold> Phylogenetic tree of the <italic>MADS-box SFA</italic> clade (see <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>), based on <italic>MADS-box</italic> and <italic>K-box</italic> protein sequences, with species subclades indicated in the outer circle (A; colors as in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>); <italic>SEP</italic>3 (see also <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>), <italic>FLC</italic>, and <italic>AS-MADS</italic> genes in the inner circle; synteny clusters with colored lines within the circle, CL6 (pink, see also <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>) and other clusters (gray); and the tree rooted by Type I MADS-box reference genes. The comparison suggests a duplication event of <italic>AS-MADS</italic> related to its syntelogs <italic>SEP3</italic> and <italic>FLC</italic>. The presence of <italic>AS-MADS</italic> (red in the inner circle) in tree non-Asteraceae species (gray and blue in the outer circle: coriander, grape, and kiwi) indicates an ancient origin of <italic>AS-MADS</italic> gene for all flowering plants. <bold>(B)</bold> Gene tree with the <italic>SEP</italic>3 clade excluded for a better view of the paralogous relationship between <italic>AS-MADS</italic> and <italic>FLC</italic>. The solid black dot squared by dashline points to <italic>LsMADS</italic>16, <italic>AS-MADS</italic> gene found in lettuce (<xref ref-type="bibr" rid="B102">Won et&#xa0;al., 2021</xref>). The hollow dots pinpoint the nine <italic>FLC</italic> and one <italic>AS-MADS</italic> in dandelion, for which the expression is shown in panel <bold>(D). (C)</bold> Hypothesized evolutionary history of <italic>AS-MADS</italic> in which an ancestral (Type II <italic>MIKC</italic>
<sup>c</sup> <italic>MADS-box</italic>) gene underwent a tandem duplicated (TD) and then went through a polyploidy event followed by the divergence of the second copy into <italic>FLC</italic> and <italic>AS-MADS</italic>. <bold>(D)</bold> Expression heatmap of the nine <italic>FLC</italic> and one <italic>AS-MADS</italic> genes found in <italic>Taraxacum officinale</italic> in the different floral stages and tissues analyzed (indicated as cartoons below the heatmap), with the different colors indicating no or very low (blue) to medium (yellow) or high (red) expression. The results show differences between the different FLC genes and particularly a deviating expression of <italic>AS-MADS</italic>, suggesting neo-functionalization.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1198909-g005.tif"/>
</fig>
<p>Based on the presence and sequence similarity of the MADS-domain, 57 potential <italic>AS-MADS</italic> candidates were first identified in the 33 species studied (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S2A</bold>
</xref>). After filtering on the presence of also the K-box domain and curation by phylogeny, 13 <italic>AS-MADS</italic> genes were retained for downstream investigation (<xref ref-type="fig" rid="f5">
<bold>Figures&#xa0;5A, B</bold>
</xref>). Interestingly, out of these 13 genes, three were from non-Asteraceae species (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S2A</bold>
</xref>), namely, <italic>C. sativum</italic> (coriander), <italic>Actinidia chinensis</italic> (kiwi), and <italic>Vitis vinifera</italic> (grape), whereas an <italic>AS-MADS</italic> gene was absent from the basal angiosperm <italic>A. trichopoda</italic>. This suggests that <italic>AS-MADS</italic> originated after the formation of the core angiosperms, but from a much more ancient root before the emergence of the Asteraceae family. Combining the synteny and phylogeny results, we infer that the <italic>AS-MADS</italic> and <italic>FLC</italic> genes probably derived from a duplication (WGD or TD) of the ancestral TD of their common ancestor (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5C</bold>
</xref>, copy 2) and the ancestor of <italic>SEP3</italic> (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5C</bold>
</xref>, copy 1) followed by their divergence.</p>
<p>As mentioned above, the <italic>FLC</italic> clade is close to the <italic>AS-MADS</italic> clade in different aspects. In lettuce and <italic>Chrysanthemum</italic>, the copies of <italic>FLC</italic> and <italic>AS-MADS</italic> show various expression patterns in different floral developmental stages and tissues (<xref ref-type="bibr" rid="B61">Ning et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B102">Won et&#xa0;al., 2021</xref>). In our dandelion genome and based on the criterion of encoding the complete <italic>MIKC</italic>
<sup>c</sup> protein (i.e., containing the MADS domain and K-box domain), we found a total of nine <italic>FLC</italic> (To_FLC_1&#x2013;9) and one <italic>AS-MADS</italic> (To_ASMADS_1) genes (indicated in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S10</bold>
</xref>, column G). These 10 genes are presented in the expression heatmap of <italic>FLC</italic>-like and <italic>AS-MADS</italic>-like genes in <italic>T. officinale</italic> (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5D</bold>
</xref>). All of them were expressed in at least one stage and tissue. Genes with a rather high expression (&gt;5 with pink or red color in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5D</bold>
</xref>) can be divided into two major groups: one that shows a more general high expression, such as To_FLC_4, To_FLC_6 and To_FLC_9, and another that shows expression in a specific stage or tissue, such as To_FLC_2 in stage 3 (F3 and S3) and To_ASMADS_1 in the young bud/ovary (F0S0 and S1). Thus, the expression pattern validated the distinctiveness of To_ASMADS_1 in contrast to the different <italic>FLC</italic> genes in dandelion. To conclude, our phylogenomic and transcriptomic data suggest a non-Asteraceae-specific origin of <italic>AS-MADS</italic> genes and advocate its different function for dandelion floral development compared to <italic>FLC</italic>.</p>
</sec>
</sec>
<sec id="s3" sec-type="discussion">
<label>3</label>
<title>Discussion</title>
<p>Here, we provide the first complete overview and first inventory in <italic>Taraxacum</italic> of <italic>MADS-box</italic> and <italic>TCP</italic> genes in the Asteraceae by comparing their results with other Asterids and representative outgroups. Our search was robust, and the identified gene numbers in the selected species were comparable to those in previous studies; for example, 82 <italic>MADS-box</italic> genes, including 23 Type I and 59 Type II genes, were reported in lettuce (<xref ref-type="bibr" rid="B61">Ning et&#xa0;al., 2019</xref>), while we found 78, including 20 Type I and 58 Type II <italic>MADS-box</italic> genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S7</bold>
</xref>). A comparative analysis of the <italic>TCP</italic> genes in the Apiaceae family identified 29 genes in <italic>Apium graveolens</italic>, 43 in <italic>C. sativum</italic>, and 50 in <italic>Daucus carota</italic> (<xref ref-type="bibr" rid="B66">Pei et&#xa0;al., 2021</xref>), while we found 32, 45, and 50 members, respectively (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S7</bold>
</xref>). In line with this, we found 27&#x2013;41 <italic>TCP</italic> genes in the Asteraceae (with one exception of five genes in <italic>Erigeron breviscapus</italic>) and 31&#x2013;34 in the three <italic>Taraxacum</italic> species.</p>
<sec id="s3_1">
<label>3.1</label>
<title>Unique patterns of gene family expansion and loss of <italic>MIKC</italic>
<sup>c</sup> <italic>MADS-box</italic> and <italic>CYC/TB1 TCP</italic> genes in Asteraceae</title>
<p>After classification of the identified <italic>MADS-box</italic> genes, we found that the Asteraceae, represented by 12 species in our analysis, contained a lower number of Type I (on average 18.5) and Type II <italic>MIKC</italic>* (on average 2.8) <italic>MADS-box</italic> genes as compared to the other selected eudicots (on average 41.8 Type I and 6.1 <italic>MIKC*</italic> genes; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S7</bold>
</xref>). In comparison to the Asteraceae, the Solanaceae, represented by five species in our study, have around four times as many Type I (on average 74.8) and Type II MIKC* (on average 11.0) <italic>MADS-box</italic> genes, which indicates a larger gene retention after its recent whole-genome triplication (WGT) (91&#x2013;52 Mya; <xref ref-type="bibr" rid="B75">Sato et&#xa0;al., 2012</xref>). Instead, the Asteraceae underwent a <italic>MADS-box</italic> Type II gene family expansion and retention after a WGT (from two successive rounds of paleopolyploidy; <xref ref-type="bibr" rid="B3">Barker et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B4">Barker et&#xa0;al., 2016</xref>), retaining more <italic>MIKC</italic>
<sup>c</sup> genes (on average 45.8) than the other eudicots (on average 36.4), such as in the Solanaceae (on average 37.2; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S7</bold>
</xref>). Thus, both the Solanaceae and Asteraceae show lineage-specific gene expansions and high levels of gene retention of Type I/Type II <italic>MIKC</italic>* and Type II <italic>MIKC</italic>
<sup>c</sup> <italic>MADS-box</italic> genes following a WGT, respectively (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). These multiplicated copies might evolve into new functions; for example, in <italic>Gerbera</italic>, eight <italic>SEP</italic>-like <italic>GERBERA REGULATOR OF CAPITULUM DEVELOPMENT</italic> (<italic>GRCD</italic>) genes are present that individually show conserved, sub-functional, and neo-functional roles in floral organ development, in contrast to the four redundant copies in <italic>Arabidopsis</italic> (reviewed by <xref ref-type="bibr" rid="B24">Elomaa et&#xa0;al., 2018</xref>). Moreover, diverged expression patterns of the duplicated genes found in our study suggest a possible novelty in regulation or function (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>&#x2013;<xref ref-type="fig" rid="f5">
<bold>5</bold>
</xref> and below).</p>
<p>A similar scenario of gene expansion was found for <italic>TCP</italic> Class II <italic>CYC</italic> genes (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>), where the Asteraceae (except for <italic>E. breviscapus</italic>) contained nearly twice as many <italic>CYC</italic> genes (on average 10.7) as compared to the non-Asteraceae (on average 5.9; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S7</bold>
</xref>). This extensive <italic>CYC</italic> duplication has been reported for many specific Asteraceae (sub)families (<xref ref-type="bibr" rid="B13">Chapman et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B37">Kim et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B86">Tahtiharju et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B32">Huang et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B15">Chen et&#xa0;al., 2018</xref>), including Senecioneae (<italic>Senecio</italic>), Mutisieae (<italic>Gerbera</italic>), Asteroideae/Heliantheae (sunflower), and Asteroideae/Anthemideae (<italic>Chrysanthemum</italic>). Our study further supports the duplication of <italic>CYC</italic> genes in the Cichorioideae, represented by dandelion and lettuce, and Carduoideae, represented by cardoon and safflower, reiterating a whole-family duplication event of the <italic>CYC</italic> clade. Moreover, the regulatory function of duplicated <italic>CYC</italic> genes for Asteraceae ray floret development reported for <italic>Gerbera</italic> and sunflower can be assigned to different copies in the <italic>CYC</italic>2 clade (<xref ref-type="bibr" rid="B13">Chapman et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B86">Tahtiharju et&#xa0;al., 2012</xref>), while the loss of one of the <italic>CYC</italic>2 genes (<italic>CYC</italic>2d) was found associated with the formation of ligulate florets (Cichorioideae; <xref ref-type="bibr" rid="B15">Chen et&#xa0;al., 2018</xref>). In our phylogeny (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S8</bold>
</xref>), we also classified the <italic>CYC</italic> genes based on the study from <xref ref-type="bibr" rid="B86">Tahtiharju et&#xa0;al. (2012)</xref>, using reference genes of <italic>Arabidopsis</italic>. The classified <italic>CYC</italic>2 clade contains two genes from <italic>T. officinale</italic>, Toff_WURv1_g24074, and Toff_WURv1_g36520, and the high expression of Toff_WURv1_g36520 in the young floral tissues, before fertilization (stages 0&#x2013;2), suggests a role in the regulation and development of the formation of ligulate florets in dandelion, while Toff_WURv1_g24074 was not expressed during floral development (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S10</bold>
</xref>). Genes from other Asteraceae species in the <italic>CYC</italic>2 clade should also be checked experimentally to determine their function in floral organ identity (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S8</bold>
</xref>).</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Lineage-specific gene loss and genomic context of <italic>MADS-box</italic> and <italic>TCP</italic> genes</title>
<p>Our phylogeny shows that the <italic>AGAMOUS</italic>-like (<italic>AG</italic>-like) clade of <italic>MADS-box</italic> genes also contains <italic>SHATTERPROOF</italic> (<italic>SHP</italic>) and <italic>SEEDSTICK</italic> (<italic>STK</italic>) (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>, represented by CL2 and CL3&#x2013;5 respectively; see also <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>), agreeing with their close relationship in previous phylogenies and classifications (<xref ref-type="bibr" rid="B87">Theissen et&#xa0;al., 2000</xref>). In the model plant <italic>Arabidopsis thaliana</italic>, <italic>SHP</italic> and <italic>STK</italic> are both involved in ovule/fruit development: <italic>SHP</italic> can activate an <italic>AG</italic>-independent carpel developmental pathway and subsequently control fruit dehiscence for seed dispersal (<xref ref-type="bibr" rid="B47">Liljegren et&#xa0;al., 2000</xref>; <xref ref-type="bibr" rid="B69">Pinyopich et&#xa0;al., 2003</xref>), and <italic>STK</italic> regulates the development of the funiculus to connect the seed to the ovary wall/placenta (<xref ref-type="bibr" rid="B69">Pinyopich et&#xa0;al., 2003</xref>). Interestingly, our phylogenomic results reveal that the <italic>SHP</italic>-type (CL2) is absent from all Asteraceae species analyzed, while it is present in most other angiosperms (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>), and the <italic>STK</italic> type of the Asteraceae (CL4; <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>) is primarily located in a different genomic context than in the other angiosperms (CL3). In a previous phylogeny of eudicot <italic>MADS-box</italic> genes, the <italic>PLENA</italic> (<italic>PLE</italic>) lineage of clustered <italic>SHP</italic>s lacked proteins from the Asteraceae, confirming that <italic>SHP</italic> genes are missing in this family (<xref ref-type="bibr" rid="B23">Dreni and Kater, 2014</xref>). Compared to the Brassicaceae (<italic>Arabidopsis</italic>), the observed absence of <italic>SHP</italic> and presence of specific <italic>STK</italic> copies potentially could be linked to the Asteraceae unique mode of seed dispersal by wind or animals through the pappus (<xref ref-type="bibr" rid="B35">Jana and Mukherjee, 2012</xref>) rather than <italic>via</italic> shattering (<xref ref-type="bibr" rid="B47">Liljegren et&#xa0;al., 2000</xref>). This may suggest that diversification into <italic>SHP</italic> has not occurred in the Asteraceae or has become lost, although some type of dehiscence still occurs in the Asteraceae to release the cypsela from the receptacle. The <italic>STK</italic> transposition might have influenced the fruit differences, such as the formation of single integument ovules and single seed ovaries in Asteraceae versus the double integument ovules and multiple seed-containing ovaries in the Brassicaceae, which need further validation.</p>
<p>
<italic>SEP</italic>-like (class E) genes are essential regulators that orchestrate the formation of different floral organs in combination with the other ABC(D) genes (<xref ref-type="bibr" rid="B89">Thei&#xdf;en et&#xa0;al., 2016</xref>). The <italic>SEP</italic>-like genes can be divided into the <italic>SEP</italic>1/2/4 clade and the <italic>SEP</italic>3 clade in <italic>Arabidopsis</italic>, where <italic>SEP</italic>3 has been shown to co-regulate the activation of B and C class <italic>MADS-box</italic> genes, being involved in all floral organs but the sepals (<xref ref-type="bibr" rid="B67">Pelaz et&#xa0;al., 2000</xref>; <xref ref-type="bibr" rid="B72">Rijpkema et&#xa0;al., 2010</xref>). In <italic>Gerbera</italic>, eight <italic>SEP</italic>-like genes are found, the GRCD genes of which <italic>GRCD</italic>4 and <italic>GRCD</italic>5 co-regulate with the B class genes and <italic>GRCD</italic>1 and <italic>GRCD</italic>2 with the C class genes in petal end stamen and carpel formation, respectively, showing an expansion and sub-functionalization of the <italic>SEP</italic>3 function in this Asteraceae species (<xref ref-type="bibr" rid="B104">Zhang et&#xa0;al., 2017</xref>). We found that also in other Asteraceae (represented by 12 species of three subfamilies), gene duplication of <italic>SEP</italic>3 lineage genes is present and revealed one Asteraceae-dominant clade of <italic>SEP</italic>3 genes with lineage-specific synteny (CL7) compared to a conserved synteny shared by the other angiosperms (CL6; <xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4B</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5A</bold>
</xref>). <italic>T. officinale</italic> has two <italic>SEP</italic>3 genes with a complete Type II structure, one in each cluster (To_SEP3_CL6_1 and To_SEP3_CL7_1 in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>). The similar expression of the two <italic>SEP</italic>3-like genes in <italic>T. officinale</italic> does not hint at a divergence in function; however, considering the diverse functions of <italic>SEP</italic>3-like genes in <italic>Gerbera</italic> (reviewed by <xref ref-type="bibr" rid="B24">Elomaa et&#xa0;al., 2018</xref>), it will be interesting to examine patterns of neo- and sub-functionalization of different <italic>SEP</italic>3 copies also in <italic>T. officinale</italic>, as well as the potential effect caused by a positional change (i.e., their different syntenies).</p>
<p>Although <italic>CYC</italic> genes are the typical <italic>TCP</italic> genes of interest for their control of flower symmetry (<xref ref-type="bibr" rid="B51">Luo et&#xa0;al., 1996</xref>), we also included the other class of <italic>TCP</italic> genes in our analysis, <italic>PCF</italic> genes, and we found an Asteraceae-specific synteny of these genes (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4C</bold>
</xref>, CL15). Overall, we found a syntenic depth of three for <italic>PCF</italic> genes, which is likely derived and retained from the ancient &#x3b3; WGT shared by the eudicots. Compared to the function of the <italic>CYC</italic> genes, <italic>PCF</italic> genes (<italic>PCF</italic>1 and <italic>PCF</italic>2) were first defined in rice and found to regulate the expression of meristematic tissues primarily <italic>via</italic> heterodimers (<xref ref-type="bibr" rid="B39">Kosugi and Ohashi, 1997</xref>). Finding an Asteraceae-specific synteny of <italic>PCF</italic> genes might, therefore, imply that they evolved a unique role in aspects of Asteraceae meristem development. The different expression of the two <italic>PCF</italic> genes in <italic>T. officinale</italic>, To_PCF_CL12_1 and To_PCF_CL15_1 (cartoon in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4C</bold>
</xref>), implies a functional or regulatory novelty. Further analysis of these genes and a test of their <italic>cis</italic>-regulatory elements to examine whether PCF_CL15 has evolved a regulatory novelty under the Asteraceae-specific genomic context could shed more light on this specific finding.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Origin and revised classification of <italic>AS-MADS</italic> gene</title>
<p>
<italic>Asteraceae-specific MADS-box</italic> gene (<italic>AS-MADS</italic>) was recently described by <xref ref-type="bibr" rid="B102">Won et&#xa0;al. (2021)</xref>, who identified a monophyletic clade comprising multiple <italic>AS-MADS</italic> copies from <italic>Chrysanthemum</italic> and one copy from lettuce. The single lettuce copy (<italic>LsMADS</italic>16) was earlier found to be in the <italic>FLC</italic>-like clade (<xref ref-type="bibr" rid="B61">Ning et&#xa0;al., 2019</xref>). In this study, we identified a monophyletic clade of <italic>AS-MADS</italic> genes anchored by <italic>LsMADS</italic>16 (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>, indicated with a black dot). Surprisingly, the <italic>AS-MADS</italic> clade also contains genes from coriander and kiwi (Apiaceae as Asteraceae outgroup and basal Asterid; both indicated in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5C</bold>
</xref> phylogenetic tree) and grape (basal rosid) in addition to those in the Asteraceae. Our phylogenomic analysis also demonstrated that <italic>AS-MADS</italic> and <italic>FLC</italic> share the same common ancestor and are both syntenic to <italic>SEP</italic>3 (<xref ref-type="fig" rid="f5">
<bold>Figures&#xa0;5A, B</bold>
</xref>). The previous study proved that <italic>FLC</italic> shares the same ancestor with <italic>SEP</italic> before the ancient tandem duplication event in seed plants (<xref ref-type="bibr" rid="B74">Ruelens et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B29">Gramzow et&#xa0;al., 2014</xref>). Based on our phylogenomic analysis, we propose that <italic>AS-MADS</italic> is also derived from the same ancestral gene of <italic>SEP</italic> and <italic>FLC</italic> (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>, visualized as copy 2). Moreover, the synteny of <italic>AS-MADS</italic> is maintained in one single cluster comprised of Asteraceae species and other eudicots, which indicates that this synteny has been retained for <italic>AS-MADS</italic> at least since the last common ancestor of the eudicots. Furthermore, <italic>FLC</italic> was found in a more ancestral species, <italic>A. trichopoda</italic> (basal angiosperm); hence, its paralog <italic>AS-MADS</italic> could also diverge from the ancient &#x3b6; WGD (i.e., shared by all angiosperms) after the <italic>SEP</italic>3&#x2013;<italic>TM</italic>8 tandem arose in the ancient flower plant ancestor. In summary, our results anticipated that the <italic>Asteraceae-specific MADS</italic> is a paralog of <italic>FLC</italic> and has a more ancient origin than previously thought but is prevalently reserved to the Asteraceae compared to other eudicots.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Expression patterns of lineage-specific genes suggest specialized functions/novel regulation in floral development</title>
<p>By combining phylogeny and synteny information, we have validated and expanded gene family classifications and the identification of orthologous relationships between genes in conserved and lineage-specific genomic contexts (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5</bold>
</xref>). Based on phylogenomic analyses, we further examined the expression of genes that we found associated with the Asteraceae, including <italic>STK</italic>-like, <italic>SEP</italic>3-like, <italic>PCF</italic>-like, and <italic>AS-MADS</italic> genes, using our <italic>T. officinale</italic> genome and floral transcriptome data as references. We found a diverse pattern of expression (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5D</bold>
</xref>, and <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S7</bold>
</xref>). The <italic>STK</italic> copy in <italic>T. officinale</italic>-specific synteny (To_STK_CL5_1) has a partial expression pattern of another copy in Asteraceae-specific synteny (To_STK_CL4_1), implying a potential sub-functionalization event. For <italic>SEP</italic>3, the expression pattern of the <italic>T. officinale</italic> copy in the Asteraceae-specific context is highly similar to the second copy in the conserved synteny with other angiosperms, which indicates a conserved function. Unlike <italic>SEP</italic>3, the two closely related <italic>T. officinale PCF</italic> genes showed a different expression during floral development, which indicates a potential regulatory novelty after gene transposition. In <italic>Phalaenopsis</italic> species, <italic>PCF</italic> genes were found to co-express with other transcription factors like <italic>MADS-box</italic> (e.g., <italic>AP</italic>3, <italic>PI</italic>, and <italic>SEP</italic>3) and <italic>MYB</italic> (e.g., <italic>TCP</italic>) genes in buds, callus, and gynostemium (<xref ref-type="bibr" rid="B70">Pramanik et&#xa0;al., 2020</xref>). A similar balancing role might be true for either one of the <italic>PCF</italic> copies. For <italic>AS-MADS</italic>, the one <italic>T. officinale</italic> copy has a different expression pattern than the other nine <italic>FLC</italic> copies, which is highly expressed in the young bud (F0S0 and S1). This result suggests the specialization of <italic>AS-MADS</italic> genes as a separate subclade of the <italic>MIKC</italic>
<sup>c</sup> type.</p>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Concluding remarks</title>
<p>We sequenced the genome and transcriptome of the common dandelion. While the genome assembly is fragmented as compared to genomes based on the latest long-read sequencing methods, it has good completeness in terms of both assembly and annotation. The work presented in our study shows the usefulness of the <italic>de novo</italic> genome and floral transcriptomes of <italic>T. officinale</italic> for unraveling aspects of the evolutionary history of the Asterids, Asteraceae, Cichorioideae, and/or <italic>Taraxacum</italic>. Combining these <italic>de novo</italic> genome sequences with genomic data of other Asterids, we systematically studied the two most important gene families related to floral development, the <italic>MADS-box</italic> and <italic>TCP</italic> genes, and revealed a handful of interesting, Asteraceae (sub)family-related uniqueness. Future high-quality genome assemblies of other Asteraceae species can facilitate and validate our conclusions about <italic>MADS-box</italic> and <italic>TCP</italic> contribution to Asteraceae floral evolution. We also validated gene expression in lineage-specific synteny or phylogeny (<italic>AS-MADS</italic>) using referenced-based mapping on our <italic>T. officinale</italic> genome. Validation of the gene expression in other Asteraceae by comparison to data from literature was inconclusive and needs investigation in a single study with various species for which the present study provides interesting guidelines. In addition to the different floral states, <italic>T. officinale</italic> material from the inflorescence meristem stages would be interesting to sequence to further explore the function of <italic>MADS-box</italic> and <italic>TCP</italic> yet highlighted in this paper.</p>
</sec>
</sec>
<sec id="s4" sec-type="materials|methods">
<label>4</label>
<title>Material and methods</title>
<sec id="s4_1">
<label>4.1</label>
<title>Plant material</title>
<p>The common dandelion accession sequenced is a sexual diploid member of a dandelion population in France near the village of Ch&#xe2;tillon, Jura (FCh72; population F3 in <xref ref-type="bibr" rid="B94">Verhoeven and Biere, 2013</xref>). It was grown from a field-collected seed and maintained in the greenhouse <italic>via</italic> cuttings, under 16/8-h light/dark conditions, frost-free, and a maximum temperature of 20&#xb0;C. FCh72 is a plant with 2<italic>n</italic> = 2<italic>x</italic> = 16 chromosomes and an estimated genome size of 831 Mb (<xref ref-type="bibr" rid="B22">Dole&#x17e;el and Barto&#x161;, 2005</xref>).</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>DNA preparation</title>
<p>One of the cuttings of plant FCh72 was placed in the dark (etiolated) for 3 days, after which young leaves were harvested, the largest veins were removed, and the remainder were frozen in liquid N<sub>2</sub> and stored at &#x2212;80&#xb0;C. DNA extraction was performed according to the cetyltrimethylammonium bromide (CTAB) method by <xref ref-type="bibr" rid="B12">Chang et&#xa0;al. (1993)</xref> with minor modification, while care was taken in all steps to keep the high-molecular-weight (HMW) DNA. In brief, a total of 2&#x2013;3-g leaf material was grounded in liquid N<sub>2</sub>, the DNA was extracted in pre-warmed CTAB buffer at 65&#xb0;C for 1 h, and the DNA was purified <italic>via</italic> two subsequent chloroform extractions and then precipitated using 0.7 volumes of isopropanol (4&#xb0;C overnight). Pellets were resuspended in 450 &#xb5;l of RNase- and DNase-free MilliQ water (MQ), and the RNA was removed by an RNase treatment with 50 Units RNaseOne&#x2122; Ribonuclease (Promega, Madison, WI, USA). An equal volume of sodium chloride&#x2013;Tris-EDTA (SSTE) 2&#xd7; buffer was added, a third chloroform extraction was performed, and the DNA precipitation was in ethanol. DNA pellets were dissolved in MQ, and the concentration and quality were examined on a NanoDrop 2000 (Thermo Scientific, Waltham, MA, USA) and Qubit 2.0 (Invitrogen, Life Technologies, Carlsbad, CA, USA), with the latter using the dsDNA HS assay (Invitrogen, Life Technologies). A total of 40 &#xb5;g of HMW DNA was prepared for PacBio and Illumina library preparations for sequencing.</p>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>RNA preparation</title>
<p>To facilitate gene annotation, a mix of RNA from <italic>T. officinale</italic> flower, bud, leaf, and root tissues was prepared. Tissues were collected from cuttings of the mentioned plant FCh72 over different days, depending on tissue availability. The largest veins were removed from the leaves, and the roots were quickly rinsed with MQ, after which the tissues were frozen in liquid N<sub>2</sub> and stored at &#x2212;80&#xb0;C. Total RNAs were extracted from each of the tissue types separately following the TRIzol reagent (Invitrogen) method with the adjustments by <xref ref-type="bibr" rid="B25">Ferreira de Carvalho et&#xa0;al. (2016)</xref>. RNAs were treated with DNAse (Turbo DNA free&#x2122; kit; Ambion, Austin, TX, USA) according to the manufacturer&#x2019;s protocol. The RNA integrity and concentration were checked on a NanoDrop 2000 and by examining the 25S:18S quality and ratio on a 1% agarose gel. Samples were then pooled to equimolar concentrations, and a total of 1.5 &#xb5;g of RNA was prepared for Illumina library preparation.</p>
<p>For floral expression analysis, RNAs from <italic>T. officinale</italic> flower buds and heads at different developmental stages were harvested from cuttings of plant FCh72, with the younger stages (stages 0, 1, and 2) in triplicate and the older stages (stages 3 and 7) as duplicates. Harvesting was performed over different days, depending on tissue availability. The samples included very young, whole buds (F0S0; initiating organs, stem ~0 cm; a mix of three buds) and buds and heads of older stages separated through the beaks in upper (F; organs in all four floral whorls) and lower (S; the inner floral whorl/ovary/seed) floral parts: mature buds (F1 and S1; organs determined and elongated, stem ~10 cm), open flowers (F2 and S2) and old flowers (F3 and S3; 3 days after pollination [DAP]), mature pappus (F7) and ripening seeds (S7; 7 DAP), and leaves (LF) (see for exact stage definitions and sample preparation <xref ref-type="bibr" rid="B99">Vijverberg et&#xa0;al., 2021</xref>). A total of 10&#x2013;40-mg tissue was collected for each sample, quickly prepared at room temperature, and then frozen in N<sub>2</sub>. Total RNAs were isolated using TRIzol reagent (Invitrogen, Life Technologies) as described above and dissolved in DEPC-MQ to a final concentration of 200 ng/&#xb5;l.</p>
</sec>
<sec id="s4_4">
<label>4.4</label>
<title>DNA and RNA sequencing</title>
<p>The <italic>Taraxacum</italic> genome was sequenced in three rounds by using a PacBio RSII sequencing system (Pacific Biosciences), 10X Genomics combined with Illumina HiSeq2500 125 paired-end sequencing (Leiden, The Netherlands), and BioNano Genomics Technology. All library preparations and sequencing were performed by the sequencing facility of Wageningen University &amp; Research, The Netherlands. PacBio uses Single Molecule Real-Time (SMRT) sequencing technology, providing long reads averaging 10&#x2013;15 kb. The 10X Genomics method is droplet-based, enabling barcode-specific sequencing of small amounts of DNAs/single DNA strands, facilitating the haplotype detection and sequence assembly. The Illumina reads were also used to polish the sequences. Optical mapping by BioNano further improved the contig assembly.</p>
<p>The RNA library preparations and sequencing for gene annotation were performed at the same sequence facility at Wageningen University &amp; Research, using Illumina HiSeq2500 125-nt paired-end sequencing. The RNA library preparation and sequencing of samples of the floral expression analysis were performed at BaseClear BV (Leiden, The Netherlands), using Illumina NovaSeq 150-nt paired-end sequencing.</p>
</sec>
<sec id="s4_5">
<label>4.5</label>
<title>Genome assembly</title>
<p>We obtained PacBio reads with the mean subread length of 12,259 bp and a total length of 62,496,657,252 bp, corresponding to ~75&#xd7; coverage of the <italic>Taraxacum</italic> genome. In addition, we obtained ~161&#xd7; of Illumina 10X 150-nt paired-end reads. The PacBio subreads were assembled using Canu (version 1.3, corMaxEvidenceErate 0.15) (<xref ref-type="bibr" rid="B38">Koren et&#xa0;al., 2017</xref>). The resulting contig assembly was checked for contaminants using blobtools (v1.0) (<xref ref-type="bibr" rid="B42">Laetsch and Blaxter, 2017</xref>) and assessed for completeness with BUSCO (v5.2.2 using eudicot_odb10) (<xref ref-type="bibr" rid="B54">Manni et&#xa0;al., 2021</xref>). Assembly statistics were gathered using Quast (v5.02) (<xref ref-type="bibr" rid="B30">Gurevich et&#xa0;al., 2013</xref>). To collapse separately assembled haplo-contigs, the purge_dups manual protocol was followed. In brief, any contigs with assembly ambiguities were split using tigmint (v1.0.0) (<xref ref-type="bibr" rid="B34">Jackman et&#xa0;al., 2018</xref>), reads were mapped back to the split assembly using minimap2 (<xref ref-type="bibr" rid="B45">Li, 2018</xref>), and putative haplo-contigs were collapsed by purge_dups using coverage information. Internal joins in scaffolds by purge_dups were then split on all 22N recognition sequences. This assembly was then polished with two rounds of RACON (v1.4.11) (<xref ref-type="bibr" rid="B93">Vaser et&#xa0;al., 2017</xref>) using the original PacBio data. Next, the polished assembly was scaffolded with the Illumina 10X data using ARCS (v1.1.0) (<xref ref-type="bibr" rid="B103">Yeo et&#xa0;al., 2018</xref>). The assembly was further scaffolded with BioNano Irys data using hybrid scaffolding. In the final step, the assembly was polished with the 10X Illumina data using Pilon (v1.22) (<xref ref-type="bibr" rid="B100">Walker et&#xa0;al., 2014</xref>).</p>
</sec>
<sec id="s4_6">
<label>4.6</label>
<title>Repeat masking</title>
<p>Repetitive sequences and transposable elements (TEs) in the <italic>T. officinale</italic> genome were identified using a combination of <italic>de novo</italic> and homology-based approaches at the DNA level. <italic>De novo</italic>: RepeatModeler (v.2.0.1 with the LTRstruct option) was used to create a <italic>de novo</italic> repeat dataset (<xref ref-type="bibr" rid="B26">Flynn et&#xa0;al., 2020</xref>). The results from RepeatModeler were combined with the RepeatMasker combined data subset relevant for <italic>T. officinale</italic> (i.e., Viridiplantae) and used as input for RepeatMasker (open-4.0). The results from RepeatMasker were used to soft-mask the genome assembly prior to annotation (<xref ref-type="bibr" rid="B79">Smit et&#xa0;al., 2019</xref>).</p>
</sec>
<sec id="s4_7">
<label>4.7</label>
<title>Gene prediction and functional annotation</title>
<p>We employed the BRAKER2 (<xref ref-type="bibr" rid="B7">Br&#x16f;na et&#xa0;al., 2021</xref>) pipeline for <italic>ab initio</italic> gene prediction. First, stranded RNAseq data from four tissues were quality and adapter trimmed using Cutadapt (v1.11) (<xref ref-type="bibr" rid="B56">Martin, 2011</xref>). The trimmed reads were aligned against the assembly (sans mitochondrial scaffold) using STAR (v2.6.1c) (<xref ref-type="bibr" rid="B20">Dobin et&#xa0;al., 2013</xref>). The aligned reads were separated into forward and reverse reads for BRAKER2 stranded mode. The reads were used as input for BRAKER2, together with the soft-masked reference. The BRAKER2 RNA evidence-based pipeline uses GeneMark-ET (<xref ref-type="bibr" rid="B50">Lomsadze et&#xa0;al., 2014</xref>) to generate initial gene structures using transcript support from RNAseq alignment. Next, AUGUSTUS (<xref ref-type="bibr" rid="B81">Stanke et&#xa0;al., 2008</xref>) uses the filtered predicted genes for parameter training and then integrates RNAseq information as extrinsic evidence into final gene predictions. For functional annotation and filtering, the transcript sequences predicted by BRAKER2 were extracted using gffread (<xref ref-type="bibr" rid="B68">Pertea and Pertea, 2020</xref>) and converted to protein sequences using EMBOSS transeq (v6.6.0; <xref ref-type="bibr" rid="B71">Rice et&#xa0;al., 2000</xref>). To identify homologous sequences, we used DIAMOND (<xref ref-type="bibr" rid="B8">Buchfink et&#xa0;al., 2021</xref>) blastp (v2.0.7, &#x201c;-b 10 &#x2013;c1 &#x2013;outfmt 5 &#x2013;sensitive&#x201d;) against nr (downloaded 06-03-2021). In addition, we analyzed the transcripts with InterProScan (v5.50-84.0) (<xref ref-type="bibr" rid="B36">Jones et&#xa0;al., 2014</xref>). Protein sequences, blast output, and InterProScan results were then imported into Blast2Go (<xref ref-type="bibr" rid="B16">Conesa et&#xa0;al., 2005</xref>) Basic (v5.2.5) and annotated with gene names and GO terms following the standard annotation pipeline. The resulting annotation was exported as gff3 file and subsequently formatted, filtered, and annotated using custom scripts. Mainly, transcripts shorter than 150 aa without homologous evidence were removed, duplicated transcripts marked in the Note field with &#x201c;Sequence identical to:&#x201d; and transcripts with more than 99% aa identity were labeled with &#x201c;Protein &gt;99 perc identical to:&#x201d; followed by the matching gene identifiers. Genes were relabeled in order of appearance on the assembly.</p>
</sec>
<sec id="s4_8">
<label>4.8</label>
<title>Genome comparison</title>
<p>We aligned our assembly with those of <italic>T. mongolica</italic> and <italic>T. kok-saghy</italic>z using minimap2 (v2.24-r1122: -x asm5 -K 4g &#x2013;cap-kalloc=2000m -t 16) and visualized the outcome in a dot plot using Dotplotly (-s -t -m 5000 -q 50000 -k 40-x). We ran BUSCO (v5.2.2 with using eudicots_odb10) on three transcriptomes to compare genome quality (see also section below).</p>
</sec>
<sec id="s4_9">
<label>4.9</label>
<title>Genome database</title>
<p>Plant whole-genome sequences of 33 species were selected for synteny network and phylogenomic analysis, including species of the two large, derived crown groups of the Asteraceae (Cichorioideae (covering <italic>Taraxacum</italic>) and Asteroideae), two species of a basal subfamily (Carduoideae) four none-Asteraceae Asterid II members, 11 species from the Asterid I clade, four early-diverging Asterids, two species of the Rosids, and the basal <italic>A. trichopoda</italic> (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S5</bold>
</xref>). Among them, 14 were retrieved from <xref ref-type="bibr" rid="B107">Zhao and Schranz (2019)</xref>, 19 from more recent studies (mainly Asteraceae), and one <italic>de novo</italic> sequenced in this study (<italic>T. officinale</italic>). The protein sequences of primary transcripts and corresponding gene positions were extracted from selected genomes for downstream phylogenic and syntenic analyses. BUSCO (v5.2.2) was used to assess the completeness of proteomes using the eudicots_odb10 dataset.</p>
</sec>
<sec id="s4_10">
<label>4.10</label>
<title>Identification and classification of <italic>MADS-box</italic> and <italic>TCP</italic> genes</title>
<p>For <italic>MADS-box</italic> genes, HMMER (v3.3.2) was used to search for the <italic>MADS-box</italic> (PF00319.20) and <italic>K-box</italic> (PF01486.20) domains in all amino acid (aa) sequences of all 33 species, with a default cutoff using the profiles of hidden Markov models (HMMs) collected from pfam (<xref ref-type="bibr" rid="B57">Mistry et&#xa0;al., 2013</xref>). To classify the identified <italic>MADS-box</italic> candidates, a reference database of 162 <italic>MADS-box</italic> genes was prepared, including 107 from <italic>A. thaliana</italic>, 32 from <italic>Petunia hybrida</italic>, 21 from <italic>Gerbera hybrida</italic>, one from <italic>Solanum lycopersicum</italic> (tomato) (TM8), and one <italic>Asteraceae-specific MADS-box</italic> gene (<italic>AS-MADS</italic>) from <italic>Lactuca sativa</italic> (lettuce) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S6</bold>
</xref>). To quickly classify the sub-families of the identified <italic>MADS-box</italic> genes, BLAST (v2.12.0) was applied to search for the best match of each candidate using aa sequence encoded by the reference genes as the database with default cutoff.</p>
<p>For <italic>TCP</italic> genes, 53 classified genes were collected, including 24 from <italic>A. thaliana</italic>, 26 from <italic>Oryza sativa</italic> (rice), two from <italic>A. majus</italic> (Garden snapdragon), and one from <italic>Zea mays</italic> (maize). The source of the sequence data from this section can be found in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S6</bold>
</xref>. HMMER was used to search for the <italic>TCP</italic> domain (PF03634.15) in 33 proteomes with the default setting. To further classify the <italic>TCP</italic> homologs, BLAST (v2.12.0) was applied to search for the best match for each candidate using the reference genes as a database.</p>
</sec>
<sec id="s4_11">
<label>4.11</label>
<title>Synteny network analysis</title>
<p>Complete synteny networks of proteomes for the 33 plant species were created by the SynNet-Pipeline from (<xref ref-type="bibr" rid="B106">Zhao and Schranz, 2017</xref>; <ext-link ext-link-type="uri" xlink:href="https://github.com/zhaotao1987/SynNet-Pipeline">https://github.com/zhaotao1987/SynNet-Pipeline</ext-link>). In this pipeline, Diamond (v2) was applied to conduct the whole-genome protein comparison (<xref ref-type="bibr" rid="B9">Buchfink et&#xa0;al., 2015</xref>). Then, MCScanX was used to detect the syntenic blocks (minimum homologs = 6 genes, max gaps =25 genes), and the output was merged into the synteny network database (<xref ref-type="bibr" rid="B101">Wang et&#xa0;al., 2012</xref>). The syntenic connections of identified <italic>MADS-box</italic> and <italic>TCP</italic> genes were extracted from the synteny network (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data S2</bold>
</xref>). Then, extracted sub-networks were further clustered (i.e., cut into small networks) by the Infomap algorithm in R (<xref ref-type="bibr" rid="B73">Rosvall and Bergstrom, 2008</xref>). Clustered synteny networks were visualized in CYTOSCAPE (v3.7.1) (<xref ref-type="bibr" rid="B76">Shannon et&#xa0;al., 2003</xref>). Next, phylogenomic profiles were built by quantifying syntenic genes per syntelog (syntenic homolog) cluster in all 33 species. Subsequently, hierarchical clustering (ward.D) was performed to re-order the synteny clusters using the Jaccard index. To study the genomic context of interesting genes, clusters were annotated by their primary syntelog(s) (&gt;10% composition). Clusters were determined as Asteraceae-specific if more than 80% of the syntelogs were from Asteraceae species. The 80% cutoff instead of 100% was selected to maintain the evidence of closely related species that shared the same WGD or WTD events with the Asteraceae.</p>
</sec>
<sec id="s4_12">
<label>4.12</label>
<title>Expression analysis</title>
<p>Analysis of gene expression and visualization thereof was performed by using CLC-Genomic Workbench (CLC-GW, v20; Qiagen), Excel, and R (v4.0; The R Foundation). For 13 <italic>MADS-box</italic> and 5 <italic>TCP</italic> genes, they were represented by two alleles (i.e., due to assembly in two haplo-contigs), identified by sequence similarity, partiality of some gene(s), flanking sequences, and expression pattern. The maximum distance between paired reads was set to 2,000 nt; raw sequence reads were trimmed on quality (0.05), ambiguity (2nt), adapters, and length (&gt;30 nt); and both paired and broken pairs were saved for mapping. Samples with high read numbers were sampled back to 60 M single reads by using the &#x201c;Random sampling&#x201d; tool. Read mapping was performed to the annotated <italic>Taraxacum</italic> genome, including all genes of length 150 nt and longer, using the &#x201c;RNAseq analysis&#x201d; tool and the following settings: Mismatch cost = 2, Insertion cost = 3, Deletion cost = 3, Length fraction = 0.5, and Similarity fraction = 0.9. Three expression values were collected: TERs, UGRs, and Unique Exon Reads (UERs). For measuring the UGRs, all genes were extended with an extra 400 nt up- and downstream of the genes to ensure including the reads that map partly or entirely in the 5&#x2032;- and 3&#x2032;-UTRs in the counts. For the final analysis and heatmaps, Total Exon Reads were used after normalization to Transcripts Per Million (TPM) in CLC-GW. The data were checked for quality using principal component analysis (PCA) and a heatmap, using the &#x201c;PCA for RNAseq&#x201d; and &#x201c;Create heatmap for RNAseq&#x201d; tools, respectively, with the latter based on Euclidean distances and complete cluster linkage. In the heatmap, stage(s)- and tissue(s)-related &#x201c;expression blocks&#x201d; were defined manually, and the corresponding &#x201c;block&#x201d; numbers were added to the genes involved. The data were then exported to Excel, and the overall expression pattern was analyzed by summing the TERs and UGRs (in TPM) over all 25 samples for each gene. Summed expressions were classified into seven groups from &#x201c;true zero&#x201d; to &#x201c;extremely high&#x201d; expression (&gt;10,000 TPM), and ratios were compared, with higher TERs explained by the total versus unique mapping of reads and higher UGRs by mapping of reads to introns and 400-nt untranslated regions (UTRs) in addition to the exons. Read values were then averaged over replicates. For this, the raw values were transformed to reads per ten million (RP10M) and averaged (AvTERs), and then the averaged values were transformed to TP10M. Subsequently, the Minimum (MIN), Maximum (MAX), Range (MAX-MIN), and Ratio (MAX/MIN) were calculated over the nine floral-related tissue types, excluding the leaf sample, for each gene. In the cases in which MIN = 0, the ratio was based on the lowest non-0 value and the number of samples without expression indicated. Heatmaps of subsets of genes were calculated based on the averaged values after excluding all non-expressed genes (MAX &lt; 5) transformation to Log2(AvTER +1), using Heatmaply in R, with the subsets of genes of interest: <italic>MADS-box</italic> genes and <italic>TCP</italic> genes.</p>
</sec>
<sec id="s4_13">
<label>4.13</label>
<title>Phylogeny reconstruction of identified genes</title>
<p>For both <italic>MADS-box</italic> and <italic>TCP</italic> genes, the protein sequences of all identified homologs were aligned based on their domains&#x2019; HMM (PF00319.20 and PF03634.15) using HmmerAlign (<xref ref-type="bibr" rid="B41">Kristensen et&#xa0;al., 2011</xref>). Next, PAL2NAL (v14) was used to convert the protein alignments back to codon alignment, and the codon alignments of <italic>MADS-box</italic> and <italic>TCP</italic> genes were trimmed by TrimAl (v1.4.1) using -automated1 and -gappyout mode, respectively (<xref ref-type="bibr" rid="B85">Suyama et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B10">Capella-Guti&#xe9;rrez et&#xa0;al., 2009</xref>). RAxML phylogenetic trees were constructed for both gene families by IQ-TREE (v1.6.2) with 1,000 ultrafast bootstrap (UFBoot) replicates to assess the final tree topology (<xref ref-type="bibr" rid="B60">Nguyen et&#xa0;al., 2015</xref>). For <italic>MADS-box</italic> genes, the best-fit model GTR+F+ASC+R10 was used by IQ-TREE (-pers 0.1, -nm 500) for 10 independent runs. For <italic>TCP</italic> genes, the best-fit model GTR+F+R6 was used by IQ-TREE to infer the phylogeny (default for other options). The consensus tree was annotated and visualized by iTOL (v6) (<xref ref-type="bibr" rid="B44">Letunic and Bork, 2021</xref>).</p>
<p>To better identify and classify the Type II type <italic>MADS-box</italic> genes, the K-box domains HMM (PF01486.20), identified by HMMER and curated by SMART, were selected and used, in addition to the MADS domain, for a second round of phylogeny reconstruction. The complete amino acid sequences were first aligned by MAFFT (v7.490) by the FFT-NS-2 strategy. Then, the protein alignment was converted back to codon alignment using PAL2NAL. Further, the residues shared by less than 5% (-gt 0.05) in alignment were trimmed by TrimAl (v1.4.1). In addition, the trimmed alignment was manually curated in Mesquite (v3.61). Finally, IQ-TREE (v1.6.12) was used to infer the maximum-likelihood trees using the GTR+F+ASC+R10 model with 1,000 ultrafast bootstrap (UFBoot) and SH-aLRT test replicates.</p>
</sec>
<sec id="s4_14">
<label>4.14</label>
<title>Synthesis of gene evolution</title>
<p>The evolutionary history of genes of interest was traced by comparative analysis of the syntenic versus gene sequence relationships by mapping the former on the phylogenetic gene trees. Identified lineage-specific genes within the Asteraceae were then checked for expression in the floral tissues of dandelion to support their diversification. After this, the genes were also checked for their expression in other Asteraceae based on data from the literature.</p>
</sec>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>Genome and transcriptome sequence data of T. officinale is deposited in the ENA SRA database under accession nos. PRJEB58885 (genome assembly), PRJEB58886 (RNAseq data of mixed tissues) and PRJEB58887 (25 RNAseq files of floral tissues and 2 of leaves); Supplementary Data S1-S5 (large Excel files) can be found at: https://doi.org/10.4121/22262773.v1.</p>
</sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>KVi, MES, KVe, and IM conceived and designed the project, with previous contributions from JFC. KVi, CO, and MB generated the materials for genome and transcriptome sequencing. JR assembled and annotated the genome, with previous contributions from LB, TZ, and HG. WX performed the phylogeny and synteny analysis. KVi performed the analysis of the expression data. WX, JR, MES, and KVi interpreted the data and wrote the manuscript. All authors critically read and approved the manuscript.</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>This work was supported by grants from the Dutch Research Council of Applied and Engineering Sciences (NWO, TTW) #13700 (ParTool) to KVi, CO, MB, TZ, and MS; Dutch Research Council (NWO) #15315 to LB; and Chinese Scholarship Council (CSC) #201707720034 to WX.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We thank Elio Schijlen, Linda Bakker, Jan van Haarst (Bioscience, Wageningen University &amp; Research [WUR], Wageningen, The Netherlands), Rens Holmer (Bioinformatics, WUR) and Frank Becker (Genetics, WUR) for bioinformatics and technical assistance, and Clo&#xe9; Villard (Biosystematics, WUR), Wenhao Li (Biometris, WUR) and Xinyu Hu for advice on graphical design.</p>
</ack>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2023.1198909/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2023.1198909/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.pdf" id="SM1" mimetype="application/pdf"/>
<supplementary-material xlink:href="Table_1.xlsx" id="ST1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alvarez-Buylla</surname> <given-names>E. R.</given-names>
</name>
<name>
<surname>Pelaz</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Liljegren</surname> <given-names>S. J.</given-names>
</name>
<name>
<surname>Gold</surname> <given-names>S. E.</given-names>
</name>
<name>
<surname>Burgeff</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Ditta</surname> <given-names>G. S.</given-names>
</name>
<etal/>
</person-group>. (<year>2000</year>). <article-title>An ancestral <italic>MADS-box</italic> gene duplication occurred before the divergence of plants and animals</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>97</volume>, <fpage>5328</fpage>&#x2013;<lpage>5333</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.97.10.5328</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Anderberg</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Baldwin</surname> <given-names>B. G.</given-names>
</name>
<name>
<surname>Bayer</surname> <given-names>R. G.</given-names>
</name>
<name>
<surname>Breitwieser</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Jeffrey</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Dillon</surname> <given-names>M. O.</given-names>
</name>
<etal/>
</person-group>. (<year>2007</year>).<article-title>&#x201c;Compositae,&#x201d;</article-title> in <source>Flowering plants eudicots</source>. Eds. <person-group person-group-type="editor">
<name>
<surname>Kadereit</surname> <given-names>J. W.</given-names>
</name>
<name>
<surname>Jeffrey</surname> <given-names>C.</given-names>
</name>
</person-group> (<publisher-loc>Berlin, Heidelberg</publisher-loc>: <publisher-name>Springer Berlin Heidelberg</publisher-name>), <fpage>61</fpage>&#x2013;<lpage>588</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-3-540-31051-8_7</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Barker</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>Kane</surname> <given-names>N. C.</given-names>
</name>
<name>
<surname>Matvienko</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kozik</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Michelmore</surname> <given-names>R. W.</given-names>
</name>
<name>
<surname>Knapp</surname> <given-names>S. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2008</year>). <article-title>Multiple paleopolyploidizations during the evolution of the compositae reveal parallel patterns of duplicate gene retention after millions of years</article-title>. <source>Mol. Biol. Evol.</source> <volume>25</volume>, <fpage>2445</fpage>&#x2013;<lpage>2455</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msn187</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Barker</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Kidder</surname> <given-names>T. I.</given-names>
</name>
<name>
<surname>Reardon</surname> <given-names>C. R.</given-names>
</name>
<name>
<surname>Lai</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Oliveira</surname> <given-names>L. O.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Most compositae (Asteraceae) are descendants of a paleohexaploid and all share a paleotetraploid ancestor with the calyceraceae</article-title>. <source>Am. J. Bot.</source> <volume>103</volume>, <fpage>1203</fpage>&#x2013;<lpage>1211</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3732/ajb.1600113</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Becker</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Thei&#xdf;en</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>The major clades of <italic>MADS-box</italic> genes and their role in the development and evolution of flowering plants</article-title>. <source>Mol. Phylogenet. Evol.</source> <volume>29</volume>, <fpage>464</fpage>&#x2013;<lpage>489</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S1055-7903(03)00207-0</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brock</surname> <given-names>M. T.</given-names>
</name>
<name>
<surname>Weinig</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Galen</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>A comparison of phenotypic plasticity in the native dandelion taraxacum ceratophorum and its invasive congener t. officinale</article-title>. <source>New Phytol.</source> <volume>166</volume>, <fpage>173</fpage>&#x2013;<lpage>183</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1469-8137.2004.01300.x</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Br&#x16f;na</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Hoff</surname> <given-names>K. J.</given-names>
</name>
<name>
<surname>Lomsadze</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Stanke</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Borodovsky</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>BRAKER2: automatic eukaryotic genome annotation with GeneMark-EP+ and AUGUSTUS supported by a protein database</article-title>. <source>NAR Genomics Bioinforma.</source> <volume>3</volume>, <fpage>1</fpage>&#x2013;<lpage>11</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nargab/lqaa108</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buchfink</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Reuter</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Drost</surname> <given-names>H. G.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Sensitive protein alignments at tree-of-life scale using DIAMOND</article-title>. <source>Nat. Methods</source> <volume>18</volume>, <fpage>366</fpage>&#x2013;<lpage>368</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41592-021-01101-x</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buchfink</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Huson</surname> <given-names>D. H.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Fast and sensitive protein alignment using DIAMOND</article-title>. <source>Nat. Methods</source> <volume>12</volume>, <fpage>59</fpage>&#x2013;<lpage>60</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.3176</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Capella-Guti&#xe9;rrez</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Silla-Mart&#xed;nez</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Gabald&#xf3;n</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>trimAl: a tool for automated alignment trimming in large-scale phylogenetic analyses</article-title>. <source>Bioinformatics</source> <volume>25</volume>, <fpage>1972</fpage>&#x2013;<lpage>1973</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/BIOINFORMATICS/BTP348</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Carlquist</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>1976</year>) <source>Tribal interrelationships and phylogeny of the asteraceae</source>. Available at: <uri xlink:href="https://scholarship.claremont.edu/alisoAvailableat:https://scholarship.claremont.edu/aliso/vol8/iss4/10">https://scholarship.claremont.edu/alisoAvailableat:https://scholarship.claremont.edu/aliso/vol8/iss4/10</uri> (Accessed <access-date>October 11, 2022</access-date>).</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Puryear</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Cairney</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>A simple and efficient method for isolating RNA from pine trees</article-title>. <source>Plant Mol. Biol. Rep.</source> <volume>11</volume>, <fpage>113</fpage>&#x2013;<lpage>116</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF02670468</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chapman</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Leebens-Mack</surname> <given-names>J. H.</given-names>
</name>
<name>
<surname>Burke</surname> <given-names>J. M.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Positive selection and expression divergence following gene duplication in the sunflower CYCLOIDEA gene family</article-title>. <source>Mol. Biol. Evol.</source> <volume>25</volume>, <fpage>1260</fpage>&#x2013;<lpage>1273</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msn001</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chase</surname> <given-names>M. W.</given-names>
</name>
<name>
<surname>Christenhusz</surname> <given-names>M. J. M.</given-names>
</name>
<name>
<surname>Fay</surname> <given-names>M. F.</given-names>
</name>
<name>
<surname>Byng</surname> <given-names>J. W.</given-names>
</name>
<name>
<surname>Judd</surname> <given-names>W. S.</given-names>
</name>
<name>
<surname>Soltis</surname> <given-names>D. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>An update of the angiosperm phylogeny group classification for the orders and families of flowering plants: APG IV</article-title>. <source>Bot. J. Linn. Soc</source> <volume>181</volume>, <fpage>1</fpage>&#x2013;<lpage>20</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/boj.12385</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>C.-Z.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>Y.-P.</given-names>
</name>
<name>
<surname>Rao</surname> <given-names>G.-Y.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Patterning the asteraceae capitulum: duplications and differential expression of the flower symmetry CYC2-like genes</article-title>. <source>Front. Plant Sci.</source> <volume>9</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2018.00551</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Conesa</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Gotz</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Garcia-Gomez</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Terol</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Talon</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Robles</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Blast2GO: a universal tool for annotation, visualization and analysis in functional genomics research</article-title>. <source>Bioinformatics</source> <volume>21</volume>, <fpage>3674</fpage>&#x2013;<lpage>3676</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bti610</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>De Bodt</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Maere</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Van De Peer</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Genome duplication and the origin of angiosperms</article-title>. <source>Trends Ecol. Evol.</source> <volume>20</volume>, <fpage>591</fpage>&#x2013;<lpage>597</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tree.2005.07.008</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dewey</surname> <given-names>C. N.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Positional orthology: putting genomic evolutionary relationships into context</article-title>. <source>Brief. Bioinform.</source> <volume>12</volume>, <fpage>401</fpage>&#x2013;<lpage>412</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bib/bbr040</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dezar</surname> <given-names>C. A.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Identification of three <italic>MADS-box</italic> genes expressed in sunflower capitulum</article-title>. <source>J. Exp. Bot.</source> <volume>54</volume>, <fpage>1637</fpage>&#x2013;<lpage>1639</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/jxb/erg163</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dobin</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Davis</surname> <given-names>C. A.</given-names>
</name>
<name>
<surname>Schlesinger</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Drenkow</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zaleski</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Jha</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2013</year>). <article-title>STAR: ultrafast universal RNA-seq aligner</article-title>. <source>Bioinformatics</source> <volume>29</volume>, <fpage>15</fpage>&#x2013;<lpage>21</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bts635</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Doebley</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Stec</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hubbard</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>The evolution of apical dominance in maize</article-title>. <source>Nature</source> <volume>386</volume>, <fpage>485</fpage>&#x2013;<lpage>488</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/386485a0</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Dole&#x17e;el</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Barto&#x161;</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Plant DNA flow cytometry and estimation of nuclear genome size</article-title>. <source>Ann. Bot.</source> <volume>95</volume>, <fpage>99</fpage>&#x2013;<lpage>110</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/aob/mci005</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dreni</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Kater</surname> <given-names>M. M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>
<italic>MADS</italic> reloaded: evolution of the <italic>AGAMOUS</italic> subfamily genes</article-title>. <source>New Phytol.</source> <volume>201</volume>, <fpage>717</fpage>&#x2013;<lpage>732</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/nph.12555</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Elomaa</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Flower heads in asteraceae&#x2013;recruitment of conserved developmental regulators to control the flower-like inflorescence architecture</article-title>. <source>Hortic. Res.</source> <volume>5</volume>, <fpage>36</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41438-018-0056-8</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ferreira de Carvalho</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Oplaat</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Pappas</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Derks</surname> <given-names>M.</given-names>
</name>
<name>
<surname>de Ridder</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Verhoeven</surname> <given-names>K. J. F.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Heritable gene expression differences between apomictic clone members in taraxacum officinale: insights into early stages of evolutionary divergence in asexual plants</article-title>. <source>BMC Genomics</source> <volume>17</volume>, <fpage>203</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12864-016-2524-6</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Flynn</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Hubley</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Goubert</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Rosen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Clark</surname> <given-names>A. G.</given-names>
</name>
<name>
<surname>Feschotte</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>RepeatModeler2 for automated genomic discovery of transposable element families</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>117</volume>, <fpage>9451</fpage>&#x2013;<lpage>9457</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1921046117</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Folk</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Siniscalchi</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Soltis</surname> <given-names>D. E.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Angiosperms at the edge: extremity, diversity, and phylogeny</article-title>. <source>Plant Cell Environ.</source> <volume>43</volume>, <fpage>2871</fpage>&#x2013;<lpage>2893</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pce.13887</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Gamboa-Tuz</surname> <given-names>S. D.</given-names>
</name>
<name>
<surname>Pereira-Santana</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Schranz</surname> <given-names>M. E.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>&#x201c;Applying synteny networks (SynNet) to study genomic arrangements of protein-coding genes in plants,&#x201d;</article-title> in <source>Methods in molecular biology</source> (<publisher-loc>New York, NY:</publisher-loc> <publisher-name>Humana Press Inc</publisher-name>), <volume>2512</volume>, <fpage>199</fpage>&#x2013;<lpage>215</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-1-0716-2429-6_12</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gramzow</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Weilandt</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Thei&#xdf;en</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>MADS goes genomic in conifers: towards determining the ancestral set of <italic>MADS-box</italic> genes in seed plants</article-title>. <source>Ann. Bot.</source> <volume>114</volume>, <fpage>1407</fpage>&#x2013;<lpage>1429</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/aob/mcu066</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gurevich</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Saveliev</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Vyahhi</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Tesler</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>QUAST: quality assessment tool for genome assemblies</article-title>. <source>Bioinformatics</source> <volume>29</volume>, <fpage>1072</fpage>&#x2013;<lpage>1075</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btt086</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Henschel</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Kofuji</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Hasebe</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Saedler</surname> <given-names>H.</given-names>
</name>
<name>
<surname>M&#xfc;nster</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Thei&#xdf;en</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Two ancient classes of <italic>MIKC</italic>-type <italic>MADS-box</italic> genes are present in the moss <italic>Physcomitrella</italic> patens</article-title>. <source>Mol. Biol. Evol.</source> <volume>19</volume>, <fpage>801</fpage>&#x2013;<lpage>814</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/oxfordjournals.molbev.a004137</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>C. H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Qi</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Multiple polyploidization events across asteraceae with two nested events in the early history revealed by nuclear phylogenomics</article-title>. <source>Mol. Biol. Evol.</source> <volume>33</volume>, <fpage>2820</fpage>&#x2013;<lpage>2835</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msw157</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ilic</surname> <given-names>K.</given-names>
</name>
<name>
<surname>SanMiguel</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>Bennetzen</surname> <given-names>J. L.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>A complex history of rearrangement in an orthologous region of the maize, sorghum, and rice genomes</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>100</volume>, <fpage>12265</fpage>&#x2013;<lpage>12270</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1434476100</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jackman</surname> <given-names>S. D.</given-names>
</name>
<name>
<surname>Coombe</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Chu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Warren</surname> <given-names>R. L.</given-names>
</name>
<name>
<surname>Vandervalk</surname> <given-names>B. P.</given-names>
</name>
<name>
<surname>Yeo</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Tigmint: correcting assembly errors using linked reads from large molecules</article-title>. <source>BMC Bioinf.</source> <volume>19</volume>, <fpage>393</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12859-018-2425-6</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jana</surname> <given-names>B. K.</given-names>
</name>
<name>
<surname>Mukherjee</surname> <given-names>S. K.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Pappus structure in the family compositae- a short communication</article-title>. <source>Int. J. Sci. Res.</source> <volume>3</volume>, <fpage>29</fpage>&#x2013;<lpage>30</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.15373/22778179/may2014/9</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jones</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Binns</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>H.-Y.</given-names>
</name>
<name>
<surname>Fraser</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<name>
<surname>McAnulla</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>InterProScan 5: genome-scale protein function classification</article-title>. <source>Bioinformatics</source> <volume>30</volume>, <fpage>1236</fpage>&#x2013;<lpage>1240</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btu031</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Cui</surname> <given-names>M. L.</given-names>
</name>
<name>
<surname>Cubas</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Gillies</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Chapman</surname> <given-names>M. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2008</year>). <article-title>Regulatory genes control a key morphological and ecological trait transferred between species</article-title>. <source>Science</source> <volume>80-.). 322</volume>, <fpage>1116</fpage>&#x2013;<lpage>1119</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1164371</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Koren</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Walenz</surname> <given-names>B. P.</given-names>
</name>
<name>
<surname>Berlin</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>J. R.</given-names>
</name>
<name>
<surname>Bergman</surname> <given-names>N. H.</given-names>
</name>
<name>
<surname>Phillippy</surname> <given-names>A. M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Canu: scalable and accurate long-read assembly <italic>via</italic> adaptive &#x3ba;-mer weighting and repeat separation</article-title>. <source>Genome Res.</source> <volume>27</volume>, <fpage>722</fpage>&#x2013;<lpage>736</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.215087.116</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kosugi</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Ohashi</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>PCF1 and PCF2 specifically bind to cis elements in the rice proliferating cell nuclear antigen gene</article-title>. <source>Plant Cell</source> <volume>9</volume>, <fpage>1607</fpage>&#x2013;<lpage>1619</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1105/tpc.9.9.1607</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kramer</surname> <given-names>E. M.</given-names>
</name>
<name>
<surname>Jaramillo</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Di Stilio</surname> <given-names>V. S.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Patterns of gene duplication and functional evolution during the diversification of the AGAMOUS subfamily of MADS box genes in angiosperms</article-title>. <source>Genetics</source> <volume>166</volume>, <fpage>1011</fpage>&#x2013;<lpage>1023</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/genetics/166.2.1011</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kristensen</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Wolf</surname> <given-names>Y. I.</given-names>
</name>
<name>
<surname>Mushegian</surname> <given-names>A. R.</given-names>
</name>
<name>
<surname>Koonin</surname> <given-names>E. V.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Computational methods for gene orthology inference</article-title>. <source>Brief. Bioinform.</source> <volume>12</volume>, <fpage>379</fpage>&#x2013;<lpage>391</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bib/bbr030</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Laetsch</surname> <given-names>D. R.</given-names>
</name>
<name>
<surname>Blaxter</surname> <given-names>M. L.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>BlobTools: interrogation of genome assemblies</article-title>. <source>F1000Research</source> <volume>6</volume>, <fpage>1287</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.12688/f1000research.12232.1</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Langham</surname> <given-names>R. J.</given-names>
</name>
<name>
<surname>Walsh</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Dunn</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Ko</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Goff</surname> <given-names>S. A.</given-names>
</name>
<name>
<surname>Freeling</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Genomic duplication, fractionation and the origin of regulatory novelty</article-title>. <source>Genetics</source> <volume>166</volume>, <fpage>935</fpage>&#x2013;<lpage>945</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/genetics/166.2.935</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Letunic</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Bork</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Interactive tree of life (iTOL) v5: an online tool for phylogenetic tree display and annotation</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>W293</fpage>&#x2013;<lpage>W296</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/NAR/GKAB301</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>The arabidopsis thaliana TCP transcription factors: a broadening horizon beyond development</article-title>. <source>Plant Signal. Behav.</source> <volume>10</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/15592324.2015.1044192</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Minimap2: pairwise alignment for nucleotide sequences</article-title>. <source>Bioinformatics</source> <volume>34</volume>, <fpage>3094</fpage>&#x2013;<lpage>3100</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bty191</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liljegren</surname> <given-names>S. J.</given-names>
</name>
<name>
<surname>Ditta</surname> <given-names>G. S.</given-names>
</name>
<name>
<surname>Eshed</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Savidge</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Bowmant</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>Yanofsky</surname> <given-names>M. F.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>
<italic>SHATTERPROOF MADS-box</italic> genes control dispersal in arabidopsis</article-title>. <source>Nat.</source> <volume>404</volume>, <fpage>766</fpage>&#x2013;<lpage>770</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/35008089</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Du</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Fan</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Hai</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Extensive sequence divergence between the reference genomes of taraxacum kok-saghyz and taraxacum mongolicum</article-title>. <source>Sci. China Life Sci.</source> <volume>653 65</volume>, <fpage>515</fpage>&#x2013;<lpage>528</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/S11427-021-2033-2</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lockton</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Gaut</surname> <given-names>B. S.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Plant conserved non-coding sequences and paralogue evolution</article-title>. <source>Trends Genet.</source> <volume>21</volume>, <fpage>60</fpage>&#x2013;<lpage>65</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tig.2004.11.013</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lomsadze</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Burns</surname> <given-names>P. D.</given-names>
</name>
<name>
<surname>Borodovsky</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Integration of mapped RNA-seq reads into automatic training of eukaryotic gene finding algorithm</article-title>. <source>Nucleic Acids Res.</source> <volume>42</volume>, <fpage>e119</fpage>&#x2013;<lpage>e119</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gku557</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Carpenter</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Vincent</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Copsey</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Coen</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Origin of floral asymmetry in antirrhinum</article-title>. <source>Nature</source> <volume>383</volume>, <fpage>794</fpage>&#x2013;<lpage>799</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/383794a0</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Magadum</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Banerjee</surname> <given-names>U.</given-names>
</name>
<name>
<surname>Murugan</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Gangapur</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Ravikesavan</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Gene duplication as a major force in evolution</article-title>. <source>J. Genet.</source> <volume>92</volume>, <fpage>155</fpage>&#x2013;<lpage>161</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12041-013-0212-8</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mandel</surname> <given-names>J. R.</given-names>
</name>
<name>
<surname>Dikow</surname> <given-names>R. B.</given-names>
</name>
<name>
<surname>Siniscalchi</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Thapa</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Watson</surname> <given-names>L. E.</given-names>
</name>
<name>
<surname>Funk</surname> <given-names>V. A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A fully resolved backbone phylogeny reveals numerous dispersals and explosive diversifications throughout the history of asteraceae</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>116</volume>, <fpage>14083</fpage>&#x2013;<lpage>14088</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1903871116</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Manni</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Berkeley</surname> <given-names>M. R.</given-names>
</name>
<name>
<surname>Seppey</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Sim&#xe3;o</surname> <given-names>F. A.</given-names>
</name>
<name>
<surname>Zdobnov</surname> <given-names>E. M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>BUSCO update: novel and streamlined workflows along with broader and deeper phylogenetic coverage for scoring of eukaryotic, prokaryotic, and viral genomes</article-title>. <source>Mol. Biol. Evol.</source> <volume>38</volume>, <fpage>4647</fpage>&#x2013;<lpage>4654</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msab199</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Martin</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Cutadapt removes adapter sequences from high-throughput sequencing reads</article-title>. <source>EMBnet.journal</source> <volume>17</volume>, <elocation-id>10</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.14806/ej.17.1.200</pub-id>
</citation>
</ref>  <ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mart&#xed;n-Trillo</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Cubas</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>
<italic>TCP</italic> genes: a family snapshot ten years later</article-title>. <source>Trends Plant Sci</source> <volume>15</volume>, <fpage>31</fpage>&#x2013;<lpage>39</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tplants.2009.11.003</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mistry</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Finn</surname> <given-names>R. D.</given-names>
</name>
<name>
<surname>Eddy</surname> <given-names>S. R.</given-names>
</name>
<name>
<surname>Bateman</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Punta</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Challenges in homology search: HMMER3 and convergent evolution of coiled-coil regions</article-title>. <source>Nucleic Acids Res.</source> <volume>41</volume>, <fpage>e121</fpage>&#x2013;<lpage>e121</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkt263</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nath</surname> <given-names>U.</given-names>
</name>
<name>
<surname>Crawford</surname> <given-names>B. C. W.</given-names>
</name>
<name>
<surname>Carpenter</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Coen</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Genetic control of surface curvature</article-title>. <source>Science</source> <volume>80-.). 299</volume>, <fpage>1404</fpage>&#x2013;<lpage>1407</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1079354</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Navaud</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Dabos</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Carnus</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Tremousaygue</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Herv&#xe9;</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>TCP Transcription factors predate the emergence of land plants</article-title>. <source>J. Mol. Evol</source> <volume>65</volume>, <fpage>23</fpage>&#x2013;<lpage>33</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00239-006-0174-z</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nguyen</surname> <given-names>L. T.</given-names>
</name>
<name>
<surname>Schmidt</surname> <given-names>H. A.</given-names>
</name>
<name>
<surname>Von Haeseler</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Minh</surname> <given-names>B. Q.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>IQ-TREE: a fast and effective stochastic algorithm for estimating maximum-likelihood phylogenies</article-title>. <source>Mol. Biol. Evol.</source> <volume>32</volume>, <fpage>268</fpage>&#x2013;<lpage>274</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msu300</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ning</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Genome-wide analysis of <italic>MADS-box</italic> family genes during flower development in lettuce</article-title>. <source>Plant Cell Environ.</source> <volume>42</volume>, <fpage>1868</fpage>&#x2013;<lpage>1881</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pce.13523</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ohno</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>1970</year>). <source>Evolution by gene duplication</source> (<publisher-loc>New York</publisher-loc>: <publisher-name>Springer-Verlag</publisher-name>).</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Palazzesi</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Pellicer</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Barreda</surname> <given-names>V. D.</given-names>
</name>
<name>
<surname>Loeuille</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Mandel</surname> <given-names>J. R.</given-names>
</name>
<name>
<surname>Pokorny</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Asteraceae as a model system for evolutionary studies: from fossils to genomes</article-title>. <source>Bot. J. Linn. Soc</source> <volume>200</volume>, <fpage>143</fpage>&#x2013;<lpage>164</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/botlinnean/boac032</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Panchy</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Lehti-Shiu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Shiu</surname> <given-names>S.-H.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Evolution of gene duplication in plants</article-title>. <source>Plant Physiol.</source> <volume>171</volume>, <fpage>2294</fpage>&#x2013;<lpage>2316</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1104/pp.16.00523</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Panero</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>Funk</surname> <given-names>V. A.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>The value of sampling anomalous taxa in phylogenetic studies: major clades of the asteraceae revealed</article-title>. <source>Mol. Phylogenet. Evol.</source> <volume>47</volume>, <fpage>757</fpage>&#x2013;<lpage>782</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ympev.2008.02.011</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pei</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Bai</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>T.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Comparative analysis of the TCP gene family in celery, coriander and carrot (family apiaceae)</article-title>. <source>Veg. Res.</source> <volume>11 1</volume>, <fpage>1</fpage>&#x2013;<lpage>12</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.48130/VR-2021-0005</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pelaz</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Ditta</surname> <given-names>G. S.</given-names>
</name>
<name>
<surname>Baumann</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Wisman</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Yanofsky</surname> <given-names>M. F.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>B and c floral organ identity functions require <italic>SEPALLATA MADS-box</italic> genes</article-title>. <source>Nature</source> <volume>405</volume>, <fpage>200</fpage>&#x2013;<lpage>203</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/35012103</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pertea</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Pertea</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>GFF utilities: GffRead and GffCompare</article-title>. <source>F1000Research</source> <volume>9</volume>, <fpage>304</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.12688/f1000research.23297.2</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pinyopich</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Ditta</surname> <given-names>G. S.</given-names>
</name>
<name>
<surname>Savidge</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Liljegren</surname> <given-names>S. J.</given-names>
</name>
<name>
<surname>Baumann</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Wisman</surname> <given-names>E.</given-names>
</name>
<etal/>
</person-group>. (<year>2003</year>). <article-title>Assessing the redundancy of <italic>MADS-box</italic> genes during carpel and ovule development</article-title>. <source>Nature</source> <volume>424</volume>, <fpage>85</fpage>&#x2013;<lpage>88</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature01741</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pramanik</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Dorst</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Meesters</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Spaans</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Smets</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Welten</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Evolution and development of three highly specialized floral structures of bee-pollinated phalaenopsis species</article-title>. <source>Evodevo</source> <volume>11</volume>, <fpage>1</fpage>&#x2013;<lpage>20</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13227-020-00160-z</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rice</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Longden</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Bleasby</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>EMBOSS: the European molecular biology open software suite</article-title>. <source>Trends Genet.</source> <volume>16</volume>, <fpage>276</fpage>&#x2013;<lpage>277</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0168-9525(00)02024-2</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rijpkema</surname> <given-names>A. S.</given-names>
</name>
<name>
<surname>Vandenbussche</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Koes</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Heijmans</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Gerats</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Variations on a theme: changes in the floral ABCs in angiosperms. semin</article-title>. <source>Cell Dev. Biol.</source> <volume>21</volume>, <fpage>100</fpage>&#x2013;<lpage>107</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.semcdb.2009.11.002</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rosvall</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Bergstrom</surname> <given-names>C. T.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Maps of random walks on complex networks reveal community structure</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>105</volume>, <fpage>1118</fpage>&#x2013;<lpage>1123</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0706851105</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ruelens</surname> <given-names>P.</given-names>
</name>
<name>
<surname>De Maagd</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Proost</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Thei&#xdf;en</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Geuten</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Kaufmann</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>
<italic>FLOWERING LOCUS</italic> c in monocots and the tandem origin of angiosperm-specific <italic>MADS-box</italic> genes</article-title>. <source>Nat. Commun.</source> <volume>4</volume>, <fpage>1</fpage>&#x2013;<lpage>8</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ncomms3280</pub-id>
</citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sato</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Tabata</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hirakawa</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Asamizu</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Shirasawa</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Isobe</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>The tomato genome sequence provides insights into fleshy fruit evolution</article-title>. <source>Nature</source> <volume>485</volume>, <fpage>635</fpage>&#x2013;<lpage>641</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature11119</pub-id>
</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shannon</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Markiel</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Ozier</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Baliga</surname> <given-names>N. S.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J. T.</given-names>
</name>
<name>
<surname>Ramage</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2003</year>). <article-title>Cytoscape: a software environment for integrated models of biomolecular interaction networks</article-title>. <source>Genome Res.</source> <volume>13</volume>, <fpage>2498</fpage>&#x2013;<lpage>2504</lpage>. doi: <pub-id pub-id-type="doi">10.1101/gr.1239303</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shen</surname> <given-names>C. Z.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>Y. P.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Clarifying recent adaptive diversification of the chrysanthemum-group on the basis of an updated multilocus phylogeny of subtribe artemisiinae (Asteraceae: anthemideae)</article-title>. <source>Front. Plant Sci.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2021.648026</pub-id>
</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smaczniak</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Immink</surname> <given-names>R. G. H.</given-names>
</name>
<name>
<surname>Mui&#xf1;o</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Blanvillain</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Busscher</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Busscher-Lange</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Characterization of MADS-domain transcription factor complexes in arabidopsis flower development</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>109</volume>, <fpage>1560</fpage>&#x2013;<lpage>1565</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1112871109</pub-id>
</citation>
</ref>
<ref id="B79">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Smit</surname> <given-names>A. F. A.</given-names>
</name>
<name>
<surname>Hubley</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Green</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2019</year>). <source>2013&#x2013;2015. RRepeatMasker Open-4.0</source>. Available at: <uri xlink:href="http://www.repeatmasker.org">http://www.repeatmasker.org</uri>.</citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname> <given-names>R. I. L.</given-names>
</name>
<name>
<surname>Richardson</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Fuegian plants in Antarctica: natural or anthropogenically assisted immigrants</article-title>? <source>Biol. Invasions</source> <volume>13</volume>, <fpage>1</fpage>&#x2013;<lpage>5</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10530-010-9784-x</pub-id>
</citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stanke</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Diekhans</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Baertsch</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Haussler</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Using native and syntenically mapped cDNA alignments to improve <italic>de novo</italic> gene finding</article-title>. <source>Bioinformatics</source> <volume>24</volume>, <fpage>637</fpage>&#x2013;<lpage>644</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btn013</pub-id>
</citation>
</ref>
<ref id="B82">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Stevens</surname> <given-names>P. F.</given-names>
</name>
</person-group> (<year>2017</year>) <source>Angiosperm phylogeny website. version 14</source> (<publisher-loc>St. Louis, Missouri USA</publisher-loc>: <publisher-name>Missouri Bot. Gard</publisher-name>). Available at: <uri xlink:href="http://www.mobot.org/MOBOT/research/APweb/">http://www.mobot.org/MOBOT/research/APweb/</uri> (Accessed <access-date>October 23, 2022</access-date>).</citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stuessy</surname> <given-names>T. F.</given-names>
</name>
<name>
<surname>Garver</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>The defensive role of pappus in heads of compositae</article-title>. <source>Compos. Biol. Util.</source> <volume>2</volume>, <fpage>81</fpage>&#x2013;<lpage>91</lpage>.</citation>
</ref>
<ref id="B84">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Susanna</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Baldwin</surname> <given-names>B. G.</given-names>
</name>
<name>
<surname>Bayer</surname> <given-names>R. J.</given-names>
</name>
<name>
<surname>Bonifacino</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Garcia-Jacas</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Keeley</surname> <given-names>S. C.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>The classification of the compositae: a tribute to Vicki Ann funk, (1947&#x2013;2019)</article-title>. <source>Taxon</source> <volume>69</volume>, <fpage>807</fpage>&#x2013;<lpage>814</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/tax.12235</pub-id>
</citation>
</ref>
<ref id="B85">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Suyama</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Torrents</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Bork</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>PAL2NAL: robust conversion of protein sequence alignments into the corresponding codon alignments</article-title>. <source>Nucleic Acids Res.</source> <volume>34</volume>, <fpage>W609&#x2013;W612</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkl315</pub-id>
</citation>
</ref>
<ref id="B86">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tahtiharju</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Rijpkema</surname> <given-names>A. S.</given-names>
</name>
<name>
<surname>Vetterli</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Albert</surname> <given-names>V. A.</given-names>
</name>
<name>
<surname>Teeri</surname> <given-names>T. H.</given-names>
</name>
<name>
<surname>Elomaa</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Evolution and diversification of the CYC/TB1 gene family in asteraceae&#x2013;a comparative study in gerbera (Mutisieae) and sunflower (Heliantheae)</article-title>. <source>Mol. Biol. Evol.</source> <volume>29</volume>, <fpage>1155</fpage>&#x2013;<lpage>1166</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msr283</pub-id>
</citation>
</ref>
<ref id="B88">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thei&#xdf;en</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>J. T.</given-names>
</name>
<name>
<surname>Saedler</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Classification and phylogeny of the <italic>MADS-box</italic> multigene family suggest defined roles of <italic>MADS-box</italic> gene subfamilies in the morphological evolution of eukaryotes</article-title>. <source>J. Mol. Evol.</source> <volume>43</volume>, <fpage>484</fpage>&#x2013;<lpage>516</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF02337521</pub-id>
</citation>
</ref>
<ref id="B89">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thei&#xdf;en</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Melzer</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Ru&#xfc;mpler</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>MADS-domain transcription factors and the floral quartet model of flower development: linking plant development and evolution</article-title>. <source>Dev.</source> <volume>143</volume>, <fpage>3259</fpage>&#x2013;<lpage>3271</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1242/dev.134080</pub-id>
</citation>
</ref>
<ref id="B87">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Theissen</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Becker</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Rosa</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Kanno</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>J. T.</given-names>
</name>
<name>
<surname>M&#xfc;nster</surname> <given-names>T.</given-names>
</name>
<etal/>
</person-group>. (<year>2000</year>)<article-title>A short history of <italic>MADS-box</italic> genes in plants</article-title>. Available at: <uri xlink:href="http://www.mpiz-koeln.mpg.de/mads/">http://www.mpiz-koeln.mpg.de/mads/</uri> (Accessed <access-date>November 2, 2021</access-date>).</citation>
</ref>
<ref id="B90">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Underwood</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Vijverberg</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Rigola</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Okamoto</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Oplaat</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Camp</surname> <given-names>R. H. M. O.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>A PARTHENOGENESIS allele from apomictic dandelion can induce egg cell division without fertilization in lettuce</article-title>. <source>Nat. Genet.</source> <volume>54</volume>, <fpage>84</fpage>&#x2013;<lpage>93</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41588-021-00984-y</pub-id>
</citation>
</ref>
<ref id="B91">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van Dijk</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>Op den Camp</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Schauer</surname> <given-names>S. E.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Genetic dissection of apomixis in dandelions identifies a dominant parthenogenesis locus and highlights the complexity of autonomous endosperm formation</article-title>. <source>Genes (Basel).</source> <volume>11</volume>, <elocation-id>961</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/genes11090961</pub-id>
</citation>
</ref>
<ref id="B92">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van Dijk</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>Tas</surname> <given-names>I. C. Q.</given-names>
</name>
<name>
<surname>Falque</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Bakx-Schotman</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Crosses between sexual and apomictic dandelions (Taraxacum). II. the breakdown of apomixis</article-title>. <source>Heredity (Edinb).</source> <volume>83</volume>, <fpage>715</fpage>&#x2013;<lpage>721</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1046/j.1365-2540.1999.00620.x</pub-id>
</citation>
</ref>
<ref id="B93">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vaser</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Sovi&#x107;</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Nagarajan</surname> <given-names>N.</given-names>
</name>
<name>
<surname>&#x160;iki&#x107;</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Fast and accurate <italic>de novo</italic> genome assembly from long uncorrected reads</article-title>. <source>Genome Res.</source> <volume>27</volume>, <fpage>737</fpage>&#x2013;<lpage>746</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.214270.116</pub-id>
</citation>
</ref>
<ref id="B94">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Verhoeven</surname> <given-names>K. J. F.</given-names>
</name>
<name>
<surname>Biere</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Geographic parthenogenesis and plant-enemy interactions in the common dandelion</article-title>. <source>BMC Evol. Biol.</source> <volume>13</volume>, <fpage>1</fpage>&#x2013;<lpage>8</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2148-13-23</pub-id>
</citation>
</ref>
<ref id="B95">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Verhoeven</surname> <given-names>K. J. F.</given-names>
</name>
<name>
<surname>Verbon</surname> <given-names>E. H.</given-names>
</name>
<name>
<surname>van Gurp</surname> <given-names>T. P.</given-names>
</name>
<name>
<surname>Oplaat</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Ferreira de Carvalho</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Morse</surname> <given-names>A. M.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Intergenerational environmental effects: functional signals in offspring transcriptomes and metabolomes after parental jasmonic acid treatment in apomictic dandelion</article-title>. <source>New Phytol.</source> <volume>217</volume>, <fpage>871</fpage>&#x2013;<lpage>882</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/nph.14835</pub-id>
</citation>
</ref>
<ref id="B96">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vijverberg</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Milanovic-Ivanovic</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Bakx-Schotman</surname> <given-names>T.</given-names>
</name>
<name>
<surname>van Dijk</surname> <given-names>P. J.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Genetic fine-mapping of DIPLOSPOROUS in taraxacum (dandelion; asteraceae) indicates a duplicated DIP-gene</article-title>. <source>BMC Plant Biol.</source> <volume>10</volume>, <elocation-id>154</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2229-10-154</pub-id>
</citation>
</ref>
<ref id="B97">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vijverberg</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Ozias-Akins</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Schranz</surname> <given-names>M. E.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Identifying and engineering genes for parthenogenesis in plants</article-title>. <source>Front. Plant Sci.</source> <volume>10</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2019.00128</pub-id>
</citation>
</ref>
<ref id="B98">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vijverberg</surname> <given-names>K.</given-names>
</name>
<name>
<surname>van der Hulst</surname> <given-names>R. G. M.</given-names>
</name>
<name>
<surname>Lindhout</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Van Dijk</surname> <given-names>P. J.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>A genetic linkage map of the diplosporous chromosomal region in taraxacum officinale (common dandelion; asteraceae)</article-title>. <source>Theor. Appl. Genet.</source> <volume>108</volume>, <fpage>725</fpage>&#x2013;<lpage>732</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00122-003-1474-y</pub-id>
</citation>
</ref>
<ref id="B99">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vijverberg</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Welten</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kraaij</surname> <given-names>M.</given-names>
</name>
<name>
<surname>van Heuven</surname> <given-names>B. J.</given-names>
</name>
<name>
<surname>Smets</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Gravendeel</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Sepal identity of the pappus and floral organ development in the common dandelion (Taraxacum officinale; asteraceae)</article-title>. <source>Plants</source> <volume>10</volume>, <elocation-id>1682</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/plants10081682</pub-id>
</citation>
</ref>
<ref id="B100">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Walker</surname> <given-names>B. J.</given-names>
</name>
<name>
<surname>Abeel</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Shea</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Priest</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Abouelliel</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Sakthikumar</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>Pilon: an integrated tool for comprehensive microbial variant detection and genome assembly improvement</article-title>. <source>PloS One</source> <volume>9</volume>, <elocation-id>e112963</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0112963</pub-id>
</citation>
</ref>
<ref id="B101">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>DeBarry</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>MCScanX: a toolkit for detection and evolutionary analysis of gene synteny and collinearity</article-title>. <source>Nucleic Acids Res.</source> <volume>40</volume>, <fpage>e49</fpage>&#x2013;<lpage>e49</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkr1293</pub-id>
</citation>
</ref>
<ref id="B102">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Won</surname> <given-names>S. Y.</given-names>
</name>
<name>
<surname>Jung</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>J. S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Genome-wide analysis of the <italic>MADS-box</italic> gene family in chrysanthemum</article-title>. <source>Comput. Biol. Chem.</source> <volume>90</volume>, <elocation-id>107424</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compbiolchem.2020.107424</pub-id>
</citation>
</ref>
<ref id="B103">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yeo</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Coombe</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Warren</surname> <given-names>R. L.</given-names>
</name>
<name>
<surname>Chu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Birol</surname> <given-names>I.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>ARCS: scaffolding genome drafts with linked reads</article-title>. <source>Bioinformatics</source> <volume>34</volume>, <fpage>725</fpage>&#x2013;<lpage>731</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btx675</pub-id>
</citation>
</ref>
<ref id="B104">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Juntheikki</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Mouhu</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Broholm</surname> <given-names>S. K.</given-names>
</name>
<name>
<surname>Rijpkema</surname> <given-names>A. S.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Dissecting functions of SEPALLATA-like <italic>MADS-box</italic> genes in patterning of the pseudanthial inflorescence of gerbera hybrida</article-title>. <source>New Phytol.</source> <volume>216</volume>, <fpage>939</fpage>&#x2013;<lpage>954</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/nph.14707</pub-id>
</citation>
</ref>
<ref id="B105">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Holmer</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Bruijn</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Angenent</surname> <given-names>G. C.</given-names>
</name>
<name>
<surname>van den Burg</surname> <given-names>H. A.</given-names>
</name>
<name>
<surname>Schranz</surname> <given-names>M. E.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Phylogenomic synteny network analysis of <italic>MADS-box</italic> transcription factor genes reveals lineage-specific transpositions, ancient tandem duplications, and deep positional conservation</article-title>. <source>Plant Cell</source> <volume>29</volume>, <fpage>1278&#x2013;1292</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1105/tpc.17.00312</pub-id>
</citation>
</ref>
<ref id="B106">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Schranz</surname> <given-names>M. E.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Network approaches for plant phylogenomic synteny analysis</article-title>. <source>Curr. Opin. Plant Biol.</source> <volume>36</volume>, <fpage>129</fpage>&#x2013;<lpage>134</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pbi.2017.03.001</pub-id>
</citation>
</ref>
<ref id="B107">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Schranz</surname> <given-names>M. E.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Network-based microsynteny analysis identifies major differences and genomic outliers in mammalian and angiosperm genomes</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>116</volume>, <fpage>2165</fpage>&#x2013;<lpage>2174</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1801757116</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>