<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2023.1258794</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Chloroplast genome assembly of <italic>Serjania erecta</italic> Raldk: comparative analysis reveals gene number variation and selection in protein-coding plastid genes of Sapindaceae</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Corval&#xe1;n</surname>
<given-names>Leonardo C. J.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sobreiro</surname>
<given-names>Mariane B.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/908389"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Carvalho</surname>
<given-names>Larissa R.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Dias</surname>
<given-names>Renata O.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/659899"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Braga-Ferreira</surname>
<given-names>Ramilla S.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Targueta</surname>
<given-names>Cintia P.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Silva-Neto</surname>
<given-names>Carlos M. e</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Berton</surname>
<given-names>Bianca W.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/692327"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Pereira</surname>
<given-names>Ana Maria S.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Diniz-filho</surname>
<given-names>Jos&#xe9; A. F.</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Telles</surname>
<given-names>Mariana P. C.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/555840"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Nunes</surname>
<given-names>Rhewter</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1118824"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Laborat&#xf3;rio de Gen&#xe9;tica &amp; Biodiversidade, Universidade Federal de Goi&#xe1;s</institution>, <addr-line>Goi&#xe2;nia</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Instituto de Ci&#xea;ncias Exatas e Naturais, Universidade Federal de Rondon&#xf3;polis</institution>, <addr-line>Rondon&#xf3;polis</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Instituto Federal de Goi&#xe1;s</institution>, <addr-line>Goi&#xe1;s</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Universidade de Ribeir&#xe3;o Preto</institution>, <addr-line>Ribeir&#xe3;o Preto</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Laborat&#xf3;rio de Ecologia Te&#xf3;rica e S&#xed;ntese, Universidade Federal de Goi&#xe1;s</institution>, <addr-line>Goi&#xe2;nia</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>Escola de Ci&#xea;ncias M&#xe9;dicas e da Vida, Pontif&#xed;cia Universidade Cat&#xf3;lica de Goi&#xe1;s</institution>, <addr-line>Goi&#xe2;nia</addr-line>, <country>Brazil</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: George Popescu, Mississippi State University, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Khurram Shahzad, Chinese Academy of Sciences (CAS), China; Eric Wade Linton, Central Michigan University, United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Rhewter Nunes, <email xlink:href="mailto:rhewter@gmail.com">rhewter@gmail.com</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>26</day>
<month>09</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1258794</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>07</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>09</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Corval&#xe1;n, Sobreiro, Carvalho, Dias, Braga-Ferreira, Targueta, Silva-Neto, Berton, Pereira, Diniz-filho, Telles and Nunes</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Corval&#xe1;n, Sobreiro, Carvalho, Dias, Braga-Ferreira, Targueta, Silva-Neto, Berton, Pereira, Diniz-filho, Telles and Nunes</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>
<italic>Serjania erecta</italic> Raldk is an essential genetic resource due to its anti-inflammatory, gastric protection, and anti-Alzheimer properties. However, the genetic and evolutionary aspects of the species remain poorly known. Here, we sequenced and assembled the complete chloroplast genome of <italic>S. erecta</italic> and used it in a comparative analysis within the Sapindaceae family. <italic>S. erecta</italic> has a chloroplast genome (cpDNA) of 159,297 bp, divided into a Large Single Copy region (LSC) of 84,556 bp and a Small Single Copy region (SSC) of 18,057 bp that are surrounded by two Inverted Repeat regions (IRa and IRb) of 28,342 bp. Among the 12 species used in the comparative analysis, <italic>S. erecta</italic> has the fewest long and microsatellite repeats. The genome structure of Sapindaceae species is relatively conserved; the number of genes varies from 128 to 132 genes, and this variation is associated with three main factors: (1) Expansion and retraction events in the size of the IRs, resulting in variations in the number of <italic>rpl22</italic>, <italic>rps19</italic>, and <italic>rps3</italic> genes; (2) Pseudogenization of the <italic>rps2</italic> gene; and (3) Loss or duplication of genes encoding tRNAs, associated with the duplication of <italic>trnH-GUG</italic> in <italic>X. sorbifolium</italic> and the absence of <italic>trnT-CGU</italic> in the Dodonaeoideae subfamily. We identified 10 and 11 mutational hotspots for Sapindaceae and Sapindoideae, respectively, and identified six highly diverse regions (<italic>tRNA-Lys &#x2014; rps16, ndhC &#x2013; tRNA-Val, petA &#x2013; psbJ, ndhF, rpl32 &#x2013; ccsA</italic>, and <italic>ycf1</italic>) are found in both groups, which show potential for the development of DNA barcode markers for molecular taxonomic identification of <italic>Serjania</italic>. We identified that the <italic>psaI</italic> gene evolves under neutrality in Sapindaceae, while all other chloroplast genes are under strong negative selection. However, local positive selection exists in the <italic>ndhF</italic>, <italic>rpoC2</italic>, <italic>ycf1</italic>, and <italic>ycf2</italic> genes. The genes <italic>ndhF</italic> and <italic>ycf1</italic> also present high nucleotide diversity and local positive selection, demonstrating significant potential as markers. Our findings include providing the first chloroplast genome of a member of the Paullinieae tribe. Furthermore, we identified patterns in variations in the number of genes and selection in genes possibly associated with the family&#x2019;s evolutionary history.</p>
</abstract>
<kwd-group>
<kwd>cpDNA</kwd>
<kwd>molecular evolution</kwd>
<kwd>negative selection</kwd>
<kwd>organellar genome</kwd>
<kwd>plastome</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="84"/>
<page-count count="14"/>
<word-count count="7709"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Plant Bioinformatics</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Chloroplasts are organelles that play an essential role in photosynthesis, which, due to their origin by endosymbiosis between cyanobacteria and primitive eukaryotic cells, have their own DNA, named cpDNA or chloroplast genome (<xref ref-type="bibr" rid="B46">Margulis and Bermudes, 1985</xref>; <xref ref-type="bibr" rid="B58">Rodr&#xed;guez-Ezpeleta et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B61">Sato, 2020</xref>). In spermatophytes, a quadripartite circular genome pattern is generally observed with two Inverted Repeat regions (IRa and IRb) separated by a Small Single Copy region (SSC) and a Large Single Copy region (LSC) (<xref ref-type="bibr" rid="B27">Jansen and Ruhlman, 2012</xref>; <xref ref-type="bibr" rid="B77">Xiao-Ming et&#xa0;al., 2017</xref>). Chloroplast genomes are generally used to investigate the evolutionary history between species, evaluate patterns of genetic diversity and demographic history of populations, develop DNA barcode markers for molecular taxonomic identification, and as targets for genetic transformation and production of organisms genetically modified (OGMs) (<xref ref-type="bibr" rid="B40">Leebens-Mack et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B11">CBOL Plant Working Group, 2009</xref>; <xref ref-type="bibr" rid="B48">Moore et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B30">Kang et&#xa0;al., 2021</xref>).</p>
<p>In land plants, the number of genes usually varies from 100 to 140, and in some families, such as Sapindaceae, Poaceae, Leguminosae, and Cactaceae, IR expansion and retraction events significantly influence the total number of genes (<xref ref-type="bibr" rid="B73">Wang et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B77">Xiao-Ming et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B65">Souza et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B36">K&#xf6;hler et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>). Although there is some variation in the number, the gene order generally seems to have a phylogenetic pattern of conservation in Angiosperms, showing potential to be used in comparative studies to test evolutionary hypotheses related to collinearity and synteny of plastid genes (<xref ref-type="bibr" rid="B75">Wicke et&#xa0;al., 2011</xref>). The chloroplast genome contains protein-coding and functional RNA-coding genes such as tRNAs (<italic>trn</italic>) and rRNAs (<italic>rrn</italic>). Most of the protein-coding genes are associated with cell replication mechanisms, such as the genes encoding the large subunit of ribosomal proteins (<italic>rpl</italic>) and the small subunit of ribosomal proteins (<italic>rps</italic>), photosystem proteins such as <italic>psa</italic> and <italic>psb</italic> genes, and the genes encoding NADH dehydrogenase proteins (ndh) (<xref ref-type="bibr" rid="B4">Allen et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B27">Jansen and Ruhlman, 2012</xref>).</p>
<p>The Sapindaceae family, also known as the soapberry family, comprises about 1900 species of 144 genera, with approximately 80% of its biodiversity contained in tropical and subtropical regions of the Southern Hemisphere (<xref ref-type="bibr" rid="B2">Acevedo-Rodr&#xed;guez et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B49">Muellner-Riehl et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B3">Acevedo-Rodr&#xed;guez et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B8">Buerki et&#xa0;al., 2021</xref>). Sapindaceae includes plants of different habits, such as trees, shrubs, lianas (woody climbing plants), and herbaceous climbing plants. It also presents species of high economic importance due to their timber, fruit, and medicinal uses (<xref ref-type="bibr" rid="B22">Ferrucci and Acevedo-Rodr&#xed;guez, 2005</xref>; <xref ref-type="bibr" rid="B9">Buerki et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B2">Acevedo-Rodr&#xed;guez et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B49">Muellner-Riehl et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>). More than 50% of the tribes of the Sapindaceae family do not have a representative with a sequenced chloroplast genome, and only 17 genera contain at least one sequenced chloroplast genome (National Center for Biotechnology Information, July 7th, 2023).</p>
<p>The Sapindaceae family emerged at the beginning of the Upper Cretaceous (105 My) and began diversifying approximately 87 My ago in Eurasia. It later diversified throughout the Southern Hemisphere during the Paleocene. Nowadays, this family is subdivided into four subfamilies: (1) Xanthoceroideae, endemic to China; (2) Hippocastanoideae, predominantly occurring in temperate regions; (3) Dodonaeoideae, distributed in tropical and subtropical regions; and (4) Sapindoideae, with wide distribution in tropical and subtropical regions, and it is the most diverse among the four subfamilies (<xref ref-type="bibr" rid="B9">Buerki et&#xa0;al., 2009</xref>). The clades that form tribes in this family are still debated. The most recent botanical revision used proposes 20 tribes, of which 16 belong to the subfamily Sapindoideae, two tribes to the subfamily Dodonaeoideae, two tribes to the subfamily Hippocastanoideae, and in the subfamily Xanthoceratoideae no tribes were classified (<xref ref-type="bibr" rid="B8">Buerki et&#xa0;al., 2021</xref>). Although molecular studies of the group have been carried out using classical markers and next-generation sequencing, evolutionary perspectives of chloroplast genomes across tribes have yet to be evaluated.</p>
<p>In Sapindaceae, the genus <italic>Serjania</italic> Mill. has approximately 230 species distributed from the United States to Argentina. The phylogenetic relationships between species of the genus need to be better defined, presenting extensive polytomies. <italic>Serjania</italic> is the unique liana genus in the Sapindaceae family, and other genera of Sapindaceae are trees, shrubs, or herbs. Furthermore, it is considered the most diverse liana genus in the tropics (<xref ref-type="bibr" rid="B1">Acevedo-Rodriguez, 1990</xref>; <xref ref-type="bibr" rid="B3">Acevedo-Rodr&#xed;guez et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B8">Buerki et&#xa0;al., 2021</xref>). All <italic>Serjania</italic> species with known karyotypes are diploid (2n=24) (<xref ref-type="bibr" rid="B69">Urdampilleta et&#xa0;al., 2012</xref>), and their genomic data are scarce, with no nuclear draft genomes or organellar genomes available in public databases. In our work, <italic>Serjania erecta</italic> Raldk (subfamily Sapindoideae; tribe Paullinieae) is the first liana species to have its chloroplast genome assembled and the second species of the Sapindaceae family from the Americas (the first one is <italic>Dodonaea viscosa</italic>) (<xref ref-type="bibr" rid="B60">Saina et&#xa0;al., 2018</xref>). <italic>Serjania erecta</italic> is a plant traditionally used to treat ulcers and hypertension with potential use in the treatment of Alzheimer&#x2019;s disease, gastric diseases, and anti-inflammatory use (<xref ref-type="bibr" rid="B24">Gomig et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B9">Buerki et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B26">Hiruma-Lima et&#xa0;al., 2009</xref>).</p>
<p>Here, we assembled the chloroplast genome of <italic>Serjania erecta</italic>, the first one of the Paullinieae tribe (Sapindaceae), and used it in comparative analysis with species of the Sapindaceae family to elucidate evolutionary aspects that occurred in these genomes. The comparative analysis had as its main aims to identify: (1) Variations in the number of genes in plastomes of the family Sapindaceae; (2) Selection pressure on genes in chloroplast genomes of the Sapindaceae family; and (3) Regions with potential use as markers for the genus <italic>Serjania</italic>.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>DNA extraction and sequencing</title>
<p>We collected leaves from an individual of <italic>Serjania erecta</italic> in the Ecocerrado Brasil Private Heritage Reserve in Arax&#xe1;, Minas Gerais, Brazil (19&#xb0;36&#x2019;47.1&#x201d; S 47&#xb0;08&#x2019;20.9&#x201d; W altitude 939 m) for DNA extraction. The species was determined using the botanical identification key for the genus (<xref ref-type="bibr" rid="B64">Somner et&#xa0;al., 2015</xref>). Plant material was identified by Dr. In&#xea;s Cordeiro (Instituto Bot&#xe2;nico, S&#xe3;o Paulo, S&#xe3;o Paulo, Brazil), and a voucher specimen was deposited in the Herbarium of Medicinal Plants at UNAERP with voucher number HPMU-835.</p>
<p>Total DNA was extracted using the CTAB protocol (<xref ref-type="bibr" rid="B19">Doyle and Doyle, 1987</xref>) and quantified using horizontal agarose gel electrophoresis (1%). The library for sequencing was constructed using the SureSelectQXT kit (catalog number 5500-0120, Agilent Technologies), and the library quality validation was performed using the Bioanalyzer 2100 (Agilent). Subsequently, the library was sequenced on the MiSeq platform (Illumina) in paired-end mode (2x300) using the MiSeq v3 600 cycles kit (Illumina). All the wet laboratory steps were conducted at the Laboratory of Genetics &amp; Biodiversity &#x2013; LGBio, at the Federal University of Goi&#xe1;s, in Goi&#xe2;nia (GO) &#x2013; Brazil.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Chloroplast genome assembly and annotation</title>
<p>Assembly of the <italic>S. erecta</italic> genome was carried out using the <italic>Serjania polyphylla rbcL</italic> gene (NCBI accession: GU935455.1) as a seed and 8,814,456 paired-end Illumina reads in the NOVOPlasty v3.2 program (<xref ref-type="bibr" rid="B16">Dierckxsens et&#xa0;al., 2017</xref>). <italic>Serjania erecta</italic> cpDNA annotation was conducted using the GeSeq webserver software (<xref ref-type="bibr" rid="B68">Tillich et&#xa0;al., 2017</xref>). In this program, the prediction of protein-coding genes and ribosomal RNAs (rRNAs) was performed using the HMMER profile Search (<xref ref-type="bibr" rid="B74">Wheeler and Eddy, 2013</xref>) and BLAT search (<xref ref-type="bibr" rid="B33">Kent, 2002</xref>) programs, and the prediction of transporter RNAs (tRNAs) using ARAGORN v1.2.38 (<xref ref-type="bibr" rid="B39">Laslett and Canback, 2004</xref>). Next, annotation problems were manually cured based on annotating other chloroplast genomes from the NCBI Genome as references using the Ugene v44.0 program (<xref ref-type="bibr" rid="B53">Okonechnikov et&#xa0;al., 2012</xref>). The graphical map of the chloroplast genome was made using Organelle Genome Draw (OGDRAW) version 1.3.1 (<xref ref-type="bibr" rid="B44">Lohse et&#xa0;al., 2013</xref>). The frequency of each codon was identified using the Sequence Manipulation Suite webserver: codon usage (<ext-link ext-link-type="uri" xlink:href="https://www.bioinformatics.org/sms2/codon_usage">https://www.bioinformatics.org/sms2/codon_usage</ext-link>).</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Comparative genomic analysis among Sapindaceae cpDNAs</title>
<p>The chloroplast genome of <italic>S. erecta</italic> was compared to 11 species belonging to the Sapindaceae family (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). These genomes were obtained from the Genome database (RefSeq) of the National Center for Biotechnology Information (NCBI) and represent all Sapindaceae genera deposited in this database (NCBI accession numbers in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>, accessed on July 7, 2023). Subsequently, all genomes were annotated using the same protocol for <italic>S. erecta</italic>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Description of twelve chloroplast genomes of the family Sapindaceae in a comparative genomic analysis.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<td valign="middle" align="left">Species</td>
<td valign="middle" align="center">Total length</td>
<td valign="middle" align="center">LSC</td>
<td valign="middle" align="center">IR</td>
<td valign="middle" align="center">SSC</td>
<td valign="middle" align="center">GC (%)</td>
<td valign="middle" align="center">Protein</td>
<td valign="middle" align="center">tRNA</td>
<td valign="middle" align="center">rRNA</td>
<td valign="middle" align="center">Total genes</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">
<italic>Serjania erecta</italic>
</td>
<td valign="middle" align="center">159,297</td>
<td valign="middle" align="center">84,556</td>
<td valign="middle" align="center">28,342</td>
<td valign="middle" align="center">18,057</td>
<td valign="middle" align="center">37.90</td>
<td valign="middle" align="center">87</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">132</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Acer buergerianum</italic>
</td>
<td valign="middle" align="center">156,477</td>
<td valign="middle" align="center">86,246</td>
<td valign="middle" align="center">26,080</td>
<td valign="middle" align="center">18,071</td>
<td valign="middle" align="center">37.88</td>
<td valign="middle" align="center">83</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">128</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Aesculus wangii</italic>
</td>
<td valign="middle" align="center">155,871</td>
<td valign="middle" align="center">84,882</td>
<td valign="middle" align="center">26,390</td>
<td valign="middle" align="center">18,210</td>
<td valign="middle" align="center">37.95</td>
<td valign="middle" align="center">83</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">128</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Dimocarpus longan</italic>
</td>
<td valign="middle" align="center">160,833</td>
<td valign="middle" align="center">85,709</td>
<td valign="middle" align="center">28,427</td>
<td valign="middle" align="center">18,270</td>
<td valign="middle" align="center">37.79</td>
<td valign="middle" align="center">87</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">132</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Dipteronia dyeriana</italic>
</td>
<td valign="middle" align="center">157,071</td>
<td valign="middle" align="center">85,530</td>
<td valign="middle" align="center">26,723</td>
<td valign="middle" align="center">18,095</td>
<td valign="middle" align="center">37.97</td>
<td valign="middle" align="center">85</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">130</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Dodonaea viscosa</italic>
</td>
<td valign="middle" align="center">159,375</td>
<td valign="middle" align="center">87,205</td>
<td valign="middle" align="center">27,099</td>
<td valign="middle" align="center">17,972</td>
<td valign="middle" align="center">37.86</td>
<td valign="middle" align="center">85</td>
<td valign="middle" align="center">36</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">129</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Eurycorymbus cavaleriei</italic>
</td>
<td valign="middle" align="center">158,777</td>
<td valign="middle" align="center">86,941</td>
<td valign="middle" align="center">26,922</td>
<td valign="middle" align="center">17,992</td>
<td valign="middle" align="center">37.92</td>
<td valign="middle" align="center">85</td>
<td valign="middle" align="center">36</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">129</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Koelreuteria paniculata</italic>
</td>
<td valign="middle" align="center">163,258</td>
<td valign="middle" align="center">90,237</td>
<td valign="middle" align="center">27,376</td>
<td valign="middle" align="center">18,269</td>
<td valign="middle" align="center">37.30</td>
<td valign="middle" align="center">85</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">130</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Litchi chinensis</italic>
</td>
<td valign="middle" align="center">162,524</td>
<td valign="middle" align="center">85,751</td>
<td valign="middle" align="center">30,102</td>
<td valign="middle" align="center">16,569</td>
<td valign="middle" align="center">37.80</td>
<td valign="middle" align="center">87</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">132</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Pometia tomentosa</italic>
</td>
<td valign="middle" align="center">160,818</td>
<td valign="middle" align="center">85,667</td>
<td valign="middle" align="center">28,395</td>
<td valign="middle" align="center">18,361</td>
<td valign="middle" align="center">37.87</td>
<td valign="middle" align="center">87</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">132</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Sapindus mukorossi</italic>
</td>
<td valign="middle" align="center">160,481</td>
<td valign="middle" align="center">85,650</td>
<td valign="middle" align="center">27,979</td>
<td valign="middle" align="center">18,873</td>
<td valign="middle" align="center">37.66</td>
<td valign="middle" align="center">87</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">132</td>
</tr>
<tr>
<td valign="middle" align="left">
<italic>Xanthoceras sorbifolium</italic>
</td>
<td valign="middle" align="center">161,231</td>
<td valign="middle" align="center">85,300</td>
<td valign="middle" align="center">28,619</td>
<td valign="middle" align="center">18,693</td>
<td valign="middle" align="center">37.69</td>
<td valign="middle" align="center">86</td>
<td valign="middle" align="center">38</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">132</td>
</tr>
<tr>
<td valign="middle" align="left">Average</td>
<td valign="middle" align="center">159,667.75</td>
<td valign="middle" align="center">86,139.50</td>
<td valign="middle" align="center">27,704.50</td>
<td valign="middle" align="center">18,119.33</td>
<td valign="middle" align="center">37.8</td>
<td valign="middle" align="center">85.58</td>
<td valign="middle" align="center">36.92</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">132.92</td>
</tr>
<tr>
<td valign="middle" align="left">Standard deviation (SD)</td>
<td valign="middle" align="center">2,319.68</td>
<td valign="middle" align="center">1,493.70</td>
<td valign="middle" align="center">1,147.41</td>
<td valign="middle" align="center">560.61</td>
<td valign="middle" align="center">0.18</td>
<td valign="middle" align="center">1.51</td>
<td valign="middle" align="center">0.51</td>
<td valign="middle" align="center">0</td>
<td valign="middle" align="center">1.88</td>
</tr>
<tr>
<td valign="middle" align="left">Coefficient of variation (CV)</td>
<td valign="middle" align="center">0.01</td>
<td valign="middle" align="center">0.02</td>
<td valign="middle" align="center">0.04</td>
<td valign="middle" align="center">0.03</td>
<td valign="middle" align="center">0.00</td>
<td valign="middle" align="center">0.02</td>
<td valign="middle" align="center">0.01</td>
<td valign="middle" align="center">0.00</td>
<td valign="middle" align="center">0.01</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>GS, chloroplast genome size; LSC, Large Single Copy region size; IR, Inverted Repeat regions size; SSC, Small Single Copy region size; GC (%), Guanine + Cytosine percentage.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>To identify the size of each region of the chloroplast genomes (Small Single Copy, Large Single Copy, and Inverted Repeats) and the genes located at their ends, Geneious Prime v. 2022.2.2 was used (<xref ref-type="bibr" rid="B32">Kearse et&#xa0;al., 2012</xref>). Identifying possible rearrangement and inversion events in chloroplast genomes was performed using the Mauve v. 2.4.0 program (<xref ref-type="bibr" rid="B14">Darling et&#xa0;al., 2004</xref>).</p>
<p>Identification of large genomic repeat structures (forward, reverse, palindromic, and complement) was conducted in the REPuter online version program (<xref ref-type="bibr" rid="B38">Kurtz et&#xa0;al., 2001</xref>), setting the minimum repeat size to 30 bp and a Hamming distance of 3 bp. Microsatellite regions (SSR) were identified using the MISA v2.1 web tool (<xref ref-type="bibr" rid="B7">Beier et&#xa0;al., 2017</xref>). For this, the minimum repeat numbers 10, 5, 4, 3, 3, and 3 were defined for the mononucleotide, dinucleotide, trinucleotide, tetranucleotide, pentanucleotide, and hexanucleotide repeats, respectively.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Phylogenetic analysis</title>
<p>We performed three phylogenetic reconstructions: One for the Sapindaceae family to understand the phylogenetic relationship of <italic>S. erecta</italic> with other chloroplast genomes of the family; the other two phylogenies aimed to test whether the available molecular markers of chloroplast genomes together with the currently available <italic>S. erecta</italic> data are capable of clarifying the phylogenetic relationships of the genus <italic>Serjania</italic>.</p>
<p>For the phylogenetic reconstruction of the chloroplast genomes of the family Sapindaceae, 23 species were selected (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>), of which 22 species belonged to the order Sapindales and one species of the order Malvales (<italic>Gossypium hirsutum</italic>), used as an outgroup (external group) in rooting from the tree. Among the species of the order Sapindales, 16 belong to the Sapindaceae family (<italic>Serjania erecta</italic>, <italic>Acer buergerianum</italic>, <italic>Acer truncatum</italic>, <italic>Acer longipes</italic>, <italic>Aesculus chinensis</italic>, <italic>Aesculus wangii</italic>, <italic>Dimocarpus longan</italic>, <italic>Dipteronia sinensis</italic>, <italic>Dipteronia dyeriana</italic>, <italic>Dodonaea viscosa</italic>, <italic>Eurycorymbus cavaleriei</italic>, <italic>Koelreuteria paniculata</italic>, <italic>Litchi chinensis</italic>, <italic>Pometia tomentosa</italic>, <italic>Sapindus mukorossi</italic>, and <italic>Xanthoceras sorbifolium</italic>), two species belonging to the Meliaceae family (<italic>Khaya senegalensis</italic> and <italic>Cedrela odorata</italic>), two species of the Rutaceae family (<italic>Citrus sinensis</italic> and <italic>Ruta graveolens</italic>). <italic>Mangifera indica</italic> and <italic>Boswellia sacra</italic> were selected for the Anacardiaceae and Burseraceae families, respectively. The CDS of these species were obtained from GenBank. Seventy-four orthologous CDS were analyzed, retaining only one copy for each duplicated gene and excluding the <italic>rpl22</italic>, <italic>rps2</italic>, <italic>rps11</italic>, and <italic>rps19</italic> genes.</p>
<p>The CDS were aligned using MAFFT v.7 (<xref ref-type="bibr" rid="B31">Katoh and Standley, 2013</xref>) and concatenated using Sequence Matrix v.1.7.8 (<xref ref-type="bibr" rid="B70">Vaidya et&#xa0;al., 2011</xref>). The most informative regions for molecular phylogeny were selected using the Gblocks webserver (<xref ref-type="bibr" rid="B67">Talavera and Castresana, 2007</xref>). Phylogenetic reconstruction was performed using the maximum likelihood (ML) method in the IQ-TREE v.1.6.12 program (<xref ref-type="bibr" rid="B51">Nguyen et&#xa0;al., 2015</xref>). In the construction of the phylogenetic tree, 63979 bp were used, and the best model was selected using the ModelFinder (<xref ref-type="bibr" rid="B29">Kalyaanamoorthy et&#xa0;al., 2017</xref>) implemented in the IQ-TREE (<xref ref-type="bibr" rid="B51">Nguyen et&#xa0;al., 2015</xref>). The GTR+F+R3 model was selected, and the tree node support values were evaluated using the bootstrapping method with 1000 replicates.</p>
<p>The other two phylogenetic trees for the genus <italic>Serjania</italic> were constructed based on previously published marker data (<xref ref-type="bibr" rid="B9">Buerki et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B10">Buerki et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B3">Acevedo-Rodr&#xed;guez et&#xa0;al., 2017</xref>). These two phylogenies were predicted using the following data: the first using data from the <italic>matK</italic>, <italic>rpoB</italic>, <italic>trnD-trnT</italic>, <italic>trnK-matK</italic>, <italic>trnL</italic>(intron), and <italic>trnL-trnF</italic> markers and the second other information only from <italic>trnL</italic> (intron) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>). For <italic>S. erecta</italic>, such regions were extracted from the chloroplast genome. In these phylogenies, we followed the same pipeline used in the ML tree of the CDS of chloroplast genomes. The best evolutionary model of nucleotide substitution for both trees was K3Pu+F.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Nucleotide diversity and molecular evolution in Sapindaceae cpDNAs</title>
<p>In the analysis of nucleotide diversity, the same twelve species used in the comparative analyzes were used (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>), separating them into two groups: (1) formed by the 12 species of the Sapindaceae family and (2) a subgroup of 6 species belonging to the Sapindoideae subfamily. The genomes of the two groups were aligned using the MAFFT program (<xref ref-type="bibr" rid="B31">Katoh and Standley, 2013</xref>), and subsequently, the calculation of nucleotide diversity (&#x3c0;) was performed using the DnaSP v6 program defining windows of 600 bp and steps of 200 bp, (<xref ref-type="bibr" rid="B59">Rozas et&#xa0;al., 2017</xref>).</p>
<p>To understand the process of evolution of chloroplast genes, we calculated the ratios between non-synonymous and synonymous mutations (ka/ks). When higher than 1.0, this ratio suggests a positive selection process; when less than 1, it suggests a negative selection process; when equal to 1.0, it indicates the absence of selection (<xref ref-type="bibr" rid="B50">Nei and Kumar, 2000</xref>). The calculation was performed using the 77 CDS in common between the chloroplast genomes of the 12 species of Sapindaceae aligned in the MAFFT program (<xref ref-type="bibr" rid="B31">Katoh and Standley, 2013</xref>). The value of ka/ks was estimated considering two neutral models, one considering a phylogenetic tree (runmode = 0; model = 0; NSsites = 0) and the other only the pairwise relationship (runmode = -2; model = 0; NSsites = 0) and establishing a minimum number of four synonymous mutations, through the PAML v.4.9 program (<xref ref-type="bibr" rid="B78">Yang, 2007</xref>).</p>
<p>The presence of local positive selection (ka/ks &gt; 1) in all 77 genes was investigated, using the contrast between selection models and neutral models: (1) M2a (positive selection model) x M1a (model neutral); (2) M8 (positive selection model with beta distribution) x M7 (neutral model with beta distribution); (3) M8 (positive selection model with beta distribution) x M8a (null hypothesis model). To test the significance of the contracts, we calculated Likelihood Ratio Tests (LRT) and the False Discovery Rate (FDR), both in R language (<xref ref-type="bibr" rid="B56">R Core Team, 2020</xref>).</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>The chloroplast genome of <italic>Serjania erecta</italic>
</title>
<p>We generated 8.8 million paired-end reads to assemble the complete chloroplast genome sequence of <italic>S. erecta</italic>. This species has a chloroplast genome size of 159,297 bp (871x of average coverage) and a guanine + cytosine content (GC%) of 37.9% (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref> and <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). Furthermore, the <italic>S. erecta</italic> cpDNA has the typical quadripartite structure of Embryophyte chloroplasts with a Large Single Copy (LSC) region of 84,556 bp, a Small Single Copy (SSC) region of 18,057 bp, and two Inverted Repeat regions (IRa and IRb) of 28,342 bp separating the SSC and LSC regions (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref> and <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>).</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Chloroplast genomic map of <italic>Serjania erecta</italic> Radlk (Sapindaceae: Sapindoideae). The genes colored according to the functional group are represented in the outermost circle, the genes external to the circumference are transcribed in a counterclockwise direction, and the internal genes are transcribed in a clockwise direction (the gray arrows indicate the beginning). The inner circle represents Inverted Repeat regions (IRa and IRb), Large Single Copy (LSC), and Small Single Copy (SSC) regions. The bar graph corresponds to the GC content. The asterisk highlights genes with introns.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258794-g001.tif"/>
</fig>
<p>We annotated 132 genes and two pseudogenes (<italic>infA</italic> and <italic>ycf1</italic>) in the chloroplast genome of <italic>S. erecta</italic>, 87 protein-coding genes, and 45 functional RNAs (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>). Among the protein-coding genes, nine genes are duplicated in the IR regions (<italic>rpl2</italic>, <italic>rpl22</italic>, <italic>rpl23</italic>, <italic>rps3</italic>, <italic>rps7</italic>, <italic>rps12</italic>, <italic>rps19</italic>, <italic>ndhB</italic>, and <italic>ycf2</italic>), nine genes have an intron (<italic>atpF</italic>, <italic>rpl2</italic>, <italic>rps12</italic>, <italic>rpl16</italic>, <italic>rps16</italic>, <italic>rpoC1</italic>, <italic>ndhA</italic>, <italic>ndhB</italic>, <italic>petB</italic>, and <italic>petD</italic>) and three genes have two introns (<italic>clpP</italic>, and <italic>ycf3</italic>) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>). We also identified 37 tRNA genes and eight rRNA genes. Considering the tRNA genes, <italic>trnM-CAU</italic> has four copies, and <italic>trnA-UGC</italic>, <italic>trnE-UUC</italic>, <italic>trnL-CAA</italic>, <italic>trnN-GUU</italic>, <italic>trnR-ACG</italic>, and <italic>trnV-GAC</italic> have two copies each. Five tRNA genes contain an intron (<italic>trnA-UGC</italic>, <italic>trnK-UUU</italic>, <italic>trnL-UAA</italic>, <italic>trnT-CGU</italic>, and <italic>trnV-UAC</italic>). There are four types of rRNA genes in the <italic>S. erecta</italic> cpDNA (<italic>rrn4.5</italic>, <italic>rrn5</italic>, <italic>rrn16</italic>, and <italic>rrn23</italic>), and they are all located in the IR regions and are therefore duplicated (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>).</p>
<p>We identified 26,991 codons in the <italic>S. erecta</italic> chloroplast genome (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S4</bold>
</xref>). The most used were AAA (Lys) and ATT (Ile), representing 1,136 (4.20%) and 1,131 (4.19%) of the total codons, respectively. Among amino acids, the most frequent is leucine (Leu), with 2,835 amino acids (10.32% of total amino acids), followed by isoleucine (Ile) and Serine (Ser), with 2,280 amino acids (8.45% of total amino acids) and 2,068 amino acids (7.66% of total amino acids), respectively.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Sapindaceae chloroplastidial genome structure</title>
<p>We performed a comparative analysis with the chloroplast genomes of <italic>S. erecta</italic> and 11 other cpDNAs from species of the Sapindaceae family. The chloroplast genome of <italic>S. erecta</italic> has a structure and genomic size similar to that of other Sapindaceae species (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>), standing out only as the species with the smallest LSC size, with 84,556 bp, which ranged up to a maximum length of 90,237 bp (<italic>Koelreuteria paniculata</italic>). The total size of chloroplast genomes ranged from 163,258 bp (<italic>K. paniculata</italic>) to 155,871 bp (<italic>Aesculus wangii</italic>). The mean GC content among the twelve Sapindaceae is 37.80%, with a standard deviation of 0.18 (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>).</p>
<p>The total number of genes in the chloroplast genomes of the family Sapindaceae ranges from 128 to 132. The most significant number of genes is described in five of the six species belonging to the subfamily Sapindoideae (<italic>Dimocarpus longan</italic>, <italic>Litchi chinensis</italic>, <italic>Pometia tomentosa</italic>, <italic>Sapindus mukorossi</italic>, and <italic>S. erecta</italic>) and in the species <italic>Xanthoceras sorbifolium</italic> (subfamily Xanthoceratoideae). The smallest number of genes was observed in the <italic>Acer buergerianum</italic> and <italic>A. wangii</italic>, both species belonging to the subfamily Hippocastanoideae (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). Chloroplast genomes with fewer genes also had smaller IR sizes (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>), which ranged from 26,080 bp in <italic>A. buergerianum</italic> species to 30,102 bp in <italic>Litchi chinensis</italic>.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Variation in the number of genes in chloroplast genomes of the Sapindaceae family ordered by phylogeny. <italic>Acer buergerianum</italic> (Abu), <italic>Aesculus wangii</italic> (Awa), <italic>Dimocarpus longan</italic> (Dlo), <italic>Dipter dyeoniariana</italic> (Ddy), <italic>Dodonaea viscosa</italic> (Dvi), <italic>Eurycorymbus cavaleriei</italic> (Eca), <italic>Koelreuteria paniculata</italic> (Kpa), <italic>Litchi chinensis</italic> (Lch), <italic>Pometia tomentosa</italic> (Pto), <italic>Sapindus mukorossi</italic> (Smu), <italic>Serjania erecta</italic> (Ser), and <italic>Xanthoceras sorbifolium</italic> (Xso).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258794-g002.tif"/>
</fig>
<p>All Sapindaceae species analyzed showed the same four rRNA genes (<italic>rrn4.5</italic>, <italic>rrn5</italic>, <italic>rrn16</italic>, and <italic>rrn23</italic>) duplicated in the IRa and IRb regions. The tRNA genes ranged from 38 genes in <italic>X. sorbifolium</italic> to 36 genes identified in the two species of the subfamily Dodonaeoideae (<italic>Dodonaea viscosa</italic> and <italic>Eurycorymbus cavaleriei</italic>). Furthermore, it is possible to observe specific genomic patterns in the analyzed genomes, such as the duplication of the <italic>trnH-GUG</italic> gene in the <italic>X. sorbifolium</italic> genome and the deletion of the <italic>trnT-CGU</italic> gene in the Dodonaeoideae subfamily (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). There were no differences regarding the number of introns in the genes of the 12 species of the Sapindaceae family (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S5</bold>
</xref>).</p>
<p>The genes that flank the borders of the chloroplast genome regions were identified to observe patterns related to the presence and position of genes (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>). Four distinct patterns appear in the border region between LSC and IRb: i) Patterns 1 - LSC-IRb flanked by the rpl16 and rps3 genes, in the species <italic>D. longan</italic>, <italic>L. chinensis</italic>, <italic>P. tomentosa</italic>, <italic>S. mukorossi</italic>, <italic>S. erecta</italic>, and <italic>X. sorbifolium</italic>; ii) Patterns 2 - LSC-IRb flanked by the <italic>rp122</italic> and <italic>rps19</italic> genes, was identified in the species <italic>D. viscosa</italic>, <italic>E. cavaleriei</italic>, and <italic>K. paniculatai</italic>; iii) Patterns 3 - LSC-IRb flanked by the <italic>rps19</italic> and <italic>rpl2</italic> genes, was identified in <italic>A. buergerianum</italic> and <italic>A. wangii</italic>; and iv)Patterns 4 - LSC-IRb in a single <italic>D. dyeriana</italic> species, flanked by the <italic>rps3</italic> and <italic>rpl22</italic> genes.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Comparison between the borders of the regions that delimit the chloroplast genomes of species from the Sapindaceae family. Inverted repeat regions (IRa and IRb) are represented in blue, the large single-copy region (LSC) in green, and the small single-copy region (SSC) in yellow. The white boxes above the bars represent counterclockwise transcribed genes, and those below represent clockwise transcribed genes. The gray boxes represent pseudogenes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258794-g003.tif"/>
</fig>
<p>Five distinct patterns were identified in the border region between IRa and LSC. In Standard 1, the LSC-IRa region is flanked by <italic>rps3</italic> and <italic>trnH</italic> in the species <italic>D. longan</italic>, <italic>L. chinensis</italic>, <italic>P. tomentosa</italic>, <italic>S. mukorossi</italic>, and <italic>S. erecta</italic>. The <italic>X. sorbifolium</italic> species is the only one where the IRa-LSC region is flanked by <italic>rps3</italic> and <italic>psbA</italic>, being the pattern 5 (IRa-LSC). pattern 2 (<italic>trnH</italic> and <italic>rps19</italic>), pattern 3 (<italic>trnH</italic> and <italic>rpl2</italic>), and patterns 4 (<italic>trnH</italic> and <italic>rpl22</italic>) (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>). The same genes in all species flanked the transition regions between IR and SSC: between IRb and SSC by pseudogenized <italic>ycf1</italic> and <italic>ndhF</italic> and between SSC and IRa by the <italic>ycf1</italic> gene (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>).</p>
<p>We identified only one chloroplast genome rearrangement event for the twelve Sapindaceae species analyzed, which resulted in the unique genomic organization of the cpDNA of <italic>K. paniculata</italic> (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S1</bold>
</xref>). In total, we identified three syntenic blocks that are divided due to a region located in the IRa of <italic>K. paniculata</italic>, which is in the reverse complementary orientation compared to the other species (block in green, <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S1</bold>
</xref>).</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Repetitive portions of the chloroplastidial genome of Sapindaceae</title>
<p>The number of large repeats among the 12 species in the comparative analysis ranged from 24 in S. erecta to 119 in <italic>K. aniculate</italic> (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>). In the Sapindaceae family, it was possible to find the four types of large repeats (forward, reverse, complement, and palindromic) in only four species, and the most frequent types were forward and palindromic. The large repeats are generally found in the LSC regions, followed by the IR, and less often in the SSC region in all species but <italic>D. viscosa</italic> (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>).</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Distribution of repeats in the chloroplast genomes of twelve species of the Sapindaceae family. <bold>(A)</bold> Distribution of large repeats by type. <bold>(B)</bold> Distribution of large repeats according to their region in the chloroplast genome. <bold>(C)</bold> Distribution of SSRs according to repetition motif. <bold>(D)</bold> Distribution of SSRs according to their region in the chloroplast genome.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258794-g004.tif"/>
</fig>
<p>
<italic>S. erecta</italic> has the lowest number of SSRs, and <italic>Sapindus mukorossi</italic> has the highest number among all the analyzed Sapindaceae species, with 58 and 91 SSR repeats, respectively (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4C</bold>
</xref>). Mononucleotide SSR repeats were the most abundant in all species. The SSRs are mainly located in the LSC and less frequently in the IR in all species (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4D</bold>
</xref>).</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Molecular evolution in chloroplast genomes of Sapindaceae</title>
<p>We reconstructed a phylogenetic tree of the Sapindaceae family using a 68,917 bp hypermatrix composed of nucleotides of 74 orthologue protein-coding genes in the chloroplast genomes of the 23 species analyzed. The phylogenetic analysis resulted in a tree with high support values for the nodes, except for the branching between the family Sapindaceae and the clade formed by the families Rutaceae and Meliaceae (bootstrap support value = 50) (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). In the Sapindaceae family, it was possible to identify the four monophyletic clades formed by the four subfamilies: Sapindoideae, Dodonaeoideae, Hippocastanoideae, and Xanthoceroideae, in agreement with the topologies proposed by <xref ref-type="bibr" rid="B9">Bueki et&#xa0;al. (2009)</xref>; <xref ref-type="bibr" rid="B8">Bueki et&#xa0;al. (2021)</xref>; <xref ref-type="bibr" rid="B3">Acevedo-rodr&#xed;guez et&#xa0;al. (2017)</xref>, and Angiosperm Phylogeny Group (APG) IV (<xref ref-type="bibr" rid="B12">Chase et&#xa0;al., 2016</xref>). The phylogeny for the genus <italic>Serjania</italic> also presented itself as a monophyletic clade, concordant with the taxonomic changes that suggested the inclusion of different genera as <italic>Serjania</italic>, proposed by <xref ref-type="bibr" rid="B3">Acevedo-Rodr&#xed;guez et&#xa0;al. (2017)</xref> (e.g., <italic>Balsas guerrerensis</italic> as <italic>Serjania guerrerensis</italic> (Cruz Dur&#xe1;n &amp; K.Vega) Acev.-Rodr.; <italic>Houssayanthus biternatus</italic> as <italic>Serjania biternata</italic> (Weath.) Acev.-Rodr.; <italic>Houssayanthus incanus</italic> as <italic>Serjania incana</italic> Radlk.) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S2</bold>
</xref>). Our phylogenetic tree is also similar to the reconstruction obtained by <xref ref-type="bibr" rid="B500">Steinmann et&#xa0;al. (2022)</xref>, which was based on nuclear ITS and chloroplast trnL-F sequences (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures S2A, B</bold>
</xref>).</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>The phylogenetic tree of the Sapindaceae family was obtained by the maximum likelihood (ML) method and proposed using 74 protein-coding genes and nucleotide sequences from the chloroplast genomes of 23 species. Numbers on the nodes represent the Bootstrap values obtained from 1000 replicates. Additionally, species from Rutaceae, Meliaceae, Burseraceae, and Anacardiaceae were added. Malvales order were used as outgroups.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258794-g005.tif"/>
</fig>
<p>The nucleotide diversity (&#x3c0;) ranged from 0.0008 to 0.1473 for the Sapindaceae family, with a median of 0.0357 (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6A</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S6</bold>
</xref>). For the subfamily Sapindoideae, the variation of nucleotide diversity was from 0 to 0.0974, with a median of 0.0227 (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6B</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S7</bold>
</xref>). Nucleotide diversity hotspots were defined as sites with values above twice the median. For the Sapindaceae family we identified ten nucleotide diversity hotspots (<italic>tRNA-Lys</italic> &#x2013; <italic>rps16</italic>, <italic>atpI &#x2013; rps2</italic>, <italic>rpoB</italic> &#x2013; <italic>tRNA-Asp</italic>, <italic>tRNA-Tyr</italic> &#x2013; <italic>psbD</italic>, <italic>psbZ</italic>, <italic>ndhC</italic> &#x2013; <italic>tRNA-Val</italic>, <italic>petA</italic> &#x2013; <italic>psbJ</italic>, <italic>ndhF</italic>, <italic>rpl32 &#x2013; cssA</italic>, and <italic>ycf1</italic>) (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6A</bold>
</xref>), and for the Sapindoideae subfamily we identified 11 nucleotide diversity hotspots (<italic>tRNA-Lys &#x2013; rps16</italic>, <italic>rps16 &#x2013; tRNA-Gln</italic>, <italic>tRNA-Ser &#x2013; tRNA-Gly</italic>, <italic>tRNA-Cys &#x2013; psbM</italic>, <italic>ndhC &#x2013; tRNA-Val</italic>, <italic>ycf4 &#x2013; cemA</italic>, <italic>petA &#x2013; psbJ</italic>, <italic>psbE &#x2013; petL</italic>, <italic>ndhF</italic>, <italic>rpl32 &#x2013; cssA</italic>, and <italic>ycf1</italic>) (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6B</bold>
</xref>). <italic>tRNA-Lys &#x2014; rps16</italic>, <italic>ndhC &#x2013; tRNA-Val, petA &#x2013; psbJ</italic>, <italic>ndhF</italic>, <italic>rpl32 &#x2013; ccsA</italic>, and <italic>ycf1</italic> are hotspots for both Sapindaceae family and Sapindoideae subfamily.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Nucleotide and mutational variation in chloroplast genomes of Sapindaceae family: <bold>(A)</bold> Distribution of nucleotide diversity along the chloroplast genomes of twelve species of the Sapindaceae family. <bold>(B)</bold> Distribution of nucleotide diversity along the chloroplast genomes of six species of the subfamily Sapindoideae. <bold>(C)</bold> Relation of non-synonymous mutations and synonymous mutations (ka/ks) for the 77 protein-coding genes found in all chloroplast genomes from the twelve species of the Sapindaceae family. The solid red line in graphs <bold>(A)</bold> and <bold>(B)</bold> indicates twice the chloroplast genome&#x2019;s median nucleotide diversity (&#x3c0;) values. The dashed red line indicates the value at which the ka/ks ratio equals 1.0, and the dashed blue line indicates the value at which the ka/ks ratio equals 0.5.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258794-g006.tif"/>
</fig>
<p>The mean values of the ratios of non-synonymous mutations and synonymous mutations (ka/ks) were 0.2160 (SD = 0.19), ranging from 0.001 for the <italic>atpH</italic>, <italic>petN</italic>, <italic>psaC</italic>, and <italic>psbL</italic> genes to 1.032 for the <italic>psaI</italic> gene (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6C</bold>
</xref>). We did not identify any gene with ka/ks values significantly greater than 1.0. Only the <italic>psaI</italic> gene showed a ratio close to 1, demonstrating that of the 77 common genes of chloroplast genomes, 76 genes are under strong negative selection.</p>
<p>To understand how natural selection works in different species in pair-by-pair comparisons, the genes with the highest ka/ks values in each of the functional groups of genes were selected (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>). For the <italic>rpl23</italic> and <italic>psaI</italic> genes (<xref ref-type="fig" rid="f7">
<bold>Figures&#xa0;7A, B</bold>
</xref>), outliers (NA) were identified, that is, genes in which the ka/ks ratios did not show the defined minimum number of synonymous mutations. The <italic>ndhB</italic> and <italic>ycf2</italic> genes (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6C</bold>
</xref>) showed the highest values of ka/ks ratio for the categories of NADH dehydrogenase and &#x201c;other genes&#x201d;, respectively, showing punctual, positive selection relationships (<xref ref-type="fig" rid="f7">
<bold>Figures&#xa0;7C, D</bold>
</xref>). In particular, <italic>S. erecta</italic> displayed the <italic>psaI</italic> gene with ka/ks values greater than 1 for 7 of the 11 species that were pairwise compared (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7B</bold>
</xref>).</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Relationships between pairwise non-synonymous and synonymous (ka/ks) mutations, considering the chloroplast protein-coding genes of 12 species of Sapindaceae. <bold>(A)</bold> Heatmap for the <italic>rpl23</italic> gene (Self-replication). <bold>(B)</bold> Heatmap for the <italic>psaI</italic> gene (photosynthesis). <bold>(C)</bold> Heatmap for the <italic>ndhB</italic> gene (NADH dehydrogenase). <bold>(D)</bold> Heatmap for the <italic>ycf2</italic> gene (other genes). Values equal to NA represent outliers, genes with fewer synonymous mutations than necessary for calculating ka/ks. <italic>Acer buergerianum</italic> (Abu), <italic>Aesculus wangii</italic> (Awa), <italic>Dimocarpus longan</italic> (Dlo), <italic>Dipter dyeoniariana</italic> (Ddy), <italic>Dodonaea viscosa</italic> (Dvi), <italic>Eurycorymbus cavaleriei</italic> (Eca), <italic>Koelreuteria paniculata</italic> (Kpa), <italic>Litchi chinensis</italic> (Lch), <italic>Pometia tomentosa</italic> (Pto<italic>), Sapindus mukorossi</italic> (Smu), <italic>Serjania erecta</italic> (Ser), and <italic>Xanthoceras sorbifolium</italic> (Xso).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258794-g007.tif"/>
</fig>
<p>We identified local positive selection signals for the three tested contrasts evidenced based on LTR and FDR (M2a x M1a; (2) M8 x M7; and (3) M8 x M8a) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S8</bold>
</xref>). Among these, the contrast between the M8 x M7 models showed the highest number of genes under local positive selection with 12 genes (<italic>atpA</italic>, <italic>clpP</italic>, <italic>matK</italic>, <italic>ndhA</italic>, <italic>ndhF</italic>, <italic>petD</italic>, <italic>psaB</italic>, <italic>rpl32</italic>, <italic>rpoB</italic>, <italic>rpoC2</italic>, <italic>ycf1</italic>, and <italic>ycf2</italic>). As for the contrasts between the M2a x M1a and M8 x M8a models, we identified positive local selection for four genes (<italic>ndhF</italic>, <italic>rpoC2</italic>, <italic>ycf1</italic>, and <italic>ycf2</italic>). The <italic>psaI</italic> gene was the only one that showed neutral evolution (ka/ks&#x2245;1) and showed significant positive selection for the LTR test.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>The chloroplast genomes of the family Sapindaceae have a relatively conserved structure for the twelve species studied (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). They show slight variation in genome size and GC content. Among the regions of the plastid genomes, the IRs showed the highest variation, with variation in the genes that flank the transition between the LSC and IR regions being associated with gene abundance (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>; <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>). These results suggest that IR expansion and retraction events are an essential source of variation in the number of genes in the Sapindaceae family, with a possible phylogenetic relationship. The <italic>S. erecta</italic> cpDNA has genomic size, structure, number of genes, and GC content within the range expected for chloroplast genomes of the family Sapindaceae (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). The GC content value for this species is most similar to that described for <italic>Dodonaea viscosa</italic> and <italic>Acer buergerianum</italic>. Among the twelve species analyzed, the GC content was highly conserved, as described so far for the Sapindaceae family (<xref ref-type="bibr" rid="B60">Saina et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B45">Ma et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>)</p>
<p>A slight variation in the size of the four regions of the chloroplast genomes (LSC, SSC, IRa, and IRb) was observed, considering the coefficient of variation (CV), the sizes of the IRs (CV=0.04) and SSC (CV=0.03) varied more than the LSC (CV=0.01), which is an expected pattern for land plants (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). (<xref ref-type="bibr" rid="B77">Xiao-Ming et&#xa0;al., 2017</xref>). This variation is related to expansion and retraction events in the size of IRs, events already described in members of the Sapindaceae family and other angiosperms as an essential evolutionary mechanism in land plants (<xref ref-type="bibr" rid="B20">Dugas et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B43">Li et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B60">Saina et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B72">Wang et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B45">Ma et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>).</p>
<p>The number of genes in the chloroplast genomes of the Sapindaceae family is consistent with previously published studies (<xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>), suggesting that this variability in the number of genes is due to three factors: the expansion and retraction in the size of the IRs, the process of pseudogenization of the <italic>rps2</italic> gene, and the mobility of the tRNA genes (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). The evidence of expansion and retraction processes in the IR regions comes from the gene colinearity in the transition of the IR regions with the LSC and SSC regions (<xref ref-type="bibr" rid="B43">Li et&#xa0;al., 2017</xref>). Thus, the identified patterns provide evidence for a possible phylogenetic relationship between the IR expansion and contraction events with the number of genes. The genes <italic>rpl22</italic>, <italic>rps19</italic>, and <italic>rps3</italic>, located in the IR in the subfamily Sapindoideae, except for the most basal species <italic>Koelreuteria paniculata</italic> (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>), are part of a set of genes encoding ribosomal proteins (<xref ref-type="bibr" rid="B501">Christopher et&#xa0;al., 1988</xref>). Among these three genes, the <italic>rps19</italic> gene is commonly found in the IR in dicotyledons, although in other families, such as Euphorbiaceae, this gene can be found in both the IR and LSC regions (<xref ref-type="bibr" rid="B43">Li et&#xa0;al., 2017</xref>). The <italic>rpl22</italic> gene, found in the chloroplast genomes of angiosperms except for the Fabaceae family, is located in the IR of the Rutaceae family (order Sapindales), indicating IR expansion events (<xref ref-type="bibr" rid="B23">Gantt et&#xa0;al., 1991</xref>; <xref ref-type="bibr" rid="B6">Bausher et&#xa0;al., 2006</xref>). Previous studies for the Sapindaceae family also showed expansion and retraction processes in the LSC-IRb region, occurring even within genera of the Sapindaceae family, highlighting that the IR expansion and retraction events are an essential source of variability in the number of genes in the Sapindaceae (<xref ref-type="bibr" rid="B43">Li et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B77">Xiao-Ming et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B60">Saina et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B45">Ma et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B36">K&#xf6;hler et&#xa0;al., 2020</xref>).</p>
<p>The <italic>rps2</italic> gene produces the 2S ribosomal protein and is pseudogenized in Hippocastanoideae and Xanthoceratoideae subfamilies (<xref ref-type="bibr" rid="B82">Zhou et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B13">Chen et&#xa0;al., 2019</xref>). This gene is often under positive selection in other angiosperm families and is located near a nucleotide diversity hotspot (<italic>atpI-rps2</italic>). Therefore, the accumulation of nonsynonymous mutations may have led to the pseudogenization of this gene (<xref ref-type="bibr" rid="B76">Wu et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B41">Li et&#xa0;al., 2020a</xref>; <xref ref-type="bibr" rid="B42">Li et&#xa0;al., 2020b</xref>; <xref ref-type="bibr" rid="B63">Sobreiro et&#xa0;al., 2020</xref>). The <italic>trnH-GUG</italic> gene is located exclusively in internal regions of the IRs in <italic>X. sorbifolium</italic>, so this duplication may not be associated with IR expansion events (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). Furthermore, other variations in genes encoding tRNAs have been identified, as the absence of <italic>trnT-CGU</italic> genes in <italic>Eurycorymbus cavariei</italic> has already been described (<xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>). The chloroplasts of <italic>D. viscosa</italic> show the same absence, perhaps indicating a synapomorphy of the subfamily Dodonaeoideae (<xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>). The <italic>trnT-CGU</italic> gene is not the only gene encoding threonine transporter RNAs, and its absence may be supplied by the other two threonine transporter RNAs in the subfamily Dodonaeoideae.</p>
<p>There is a high level of gene conservation in the cpDNAs of the Sapindaceae family, all of which have the same number of introns. The <italic>clpP</italic>, <italic>rps12</italic>, and <italic>ycf3</italic> genes have two introns and were observed in all annotated species, unlike some annotations that did not identify the <italic>rps12</italic> gene (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S5</bold>
</xref>). The <italic>rps12</italic> gene has two 3&#x2019; exons in the IR and one 5&#x2019; exon in the LSC and is a trans-spliced gene. The trans-spliced <italic>rps12</italic> gene has been reported in several Viridiplantae. In some taxonomic groups, such as ferns, one intron of <italic>rps12</italic> has been lost (<xref ref-type="bibr" rid="B25">Hildebrand et&#xa0;al., 1988</xref>; <xref ref-type="bibr" rid="B45">Ma et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B63">Sobreiro et&#xa0;al., 2020</xref>). We identified two pseudogenes (<italic>infA</italic> and one of the <italic>ycf1</italic> copies) in all Sapindaceae species. The <italic>infA</italic> gene is a mobile gene that has undergone several transfer events from the chloroplast to the nucleus, mainly in lineages of the Rosid clade (<xref ref-type="bibr" rid="B47">Millen et&#xa0;al., 2001</xref>). Pseudogenization of one of the ycf1 copies is common in angiosperm chloroplast genomes and occurs due to its location in the transition zone between the IR and SSC regions (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>) (<xref ref-type="bibr" rid="B43">Li et&#xa0;al., 2017</xref>).</p>
<p>Among the species we identified repetitive regions, <italic>K. paniculata</italic> and <italic>S. erecta</italic> had the highest and lowest amounts of wide repeats, respectively. <italic>Sapindus mukorossi</italic> and <italic>S. erecta</italic> are the species with the highest and lowest amounts of microsatellite repeats (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>), respectively, confirming a previous study highlighting that <italic>S. mukorossi</italic> has large numbers of repetitive regions in its chloroplast (<xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>). Such repetitive regions are highly informative about genetic diversity within species and are commonly used as molecular markers in studies of biogeography and population genetics (<xref ref-type="bibr" rid="B71">Varshney et&#xa0;al., 2005</xref>).</p>
<p>Leucine and cysteine are the most and least abundant amino acids constituting the proteins of the <italic>S. erecta</italic> chloroplast genome (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S5</bold>
</xref>), as previously described in other species of Sapindaceae and angiosperms (<xref ref-type="bibr" rid="B49">Muellner-Riehl et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B45">Ma et&#xa0;al., 2019</xref>). The predominant use of some amino acids in chloroplasts may be related to the conservation of genes encoding tRNAs since the composition and number of tRNAs affect the codon composition (<xref ref-type="bibr" rid="B52">Novoa et&#xa0;al., 2012</xref>).</p>
<p>The ka/ks ratio is a valuable analysis for understanding the evolutionary process within genes, so values greater than 1 (Ka/Ks &gt; 1) indicate positive selection, values equal to 1 (Ka/Ks = 1) indicate neutrality and values less than 1 (Ka/Ks &lt; 1) indicate negative selection (<xref ref-type="bibr" rid="B50">Nei and Kumar, 2000</xref>). We found no evidence of positive selection for any of the cpDNA protein-coding genes (ka/ks &gt; 1) (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6C</bold>
</xref>). Only the <italic>psaI</italic> gene is under neutrality, indicating a high conservation of amino acid sequences produced by chloroplast protein-coding genes in Sapindales. The <italic>psaI</italic> gene makes up subunit VIII of the photosystem I reaction center and showed evidence of local positive selection in other studies (<xref ref-type="bibr" rid="B55">Pl&#xf6;chinger et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B62">Sch&#xf6;ttler et&#xa0;al., 2017</xref>). Previous tests in <italic>Nicotiana tabacum</italic>, inducing mutations in this gene, did not cause changes in plant growth and only responded to high light and cold stress during leaf senescence (<xref ref-type="bibr" rid="B62">Sch&#xf6;ttler et&#xa0;al., 2017</xref>). Although <italic>psaI</italic> is the only gene under neutral evolution, several of the ka/ks relationships did not show synonymous mutations (ka), and the highest values of the relationships are primarily associated with <italic>S. erecta</italic> genes (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7B</bold>
</xref>). A pairwise comparison of <italic>S. erecta</italic> with the other species for the <italic>psaI</italic> gene shows an accumulation of non-synonymous mutations in this species, indicating possible positive selection. This heterogeneous speciation process in the <italic>psaI</italic> gene may be associated with evolutionary factors of the tribe or species. The <italic>S. erecta</italic> is the unique Sapindaceae liana with data available; positive selection for <italic>psaI</italic> may be linked to this habit, as this gene is associated with responses to light and cold. We suggest that comparisons of this gene with orthologous genes from species closer to <italic>S. erecta</italic> are needed to assess the evolutionary impact of these non-synonymous mutations.</p>
<p>The contrasts between the M8 x M7 models identified 12 genes (<italic>atpA</italic>, <italic>clpP</italic>, <italic>matK</italic>, <italic>ndhA</italic>, <italic>ndhF</italic>, <italic>petD</italic>, <italic>psaB</italic>, <italic>rpl32</italic>, <italic>rpoB</italic>, <italic>rpoC2</italic>, <italic>ycf1</italic>, and <italic>ycf2</italic>) under local positive selection (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S8</bold>
</xref>), among these genes one is an ATP subunit (<italic>atpA</italic>), one encodes a protease (<italic>clpP</italic>), one encodes maturase (<italic>matK</italic>), two encodes NADH dehydrogenase subunits (<italic>ndhA</italic> and <italic>ndhF)</italic>, one composes the Cytochrome b/f complex (<italic>petD</italic>), one encodes a Photosystem I subunit (<italic>psaB</italic>), one encode a ribosomal protein subunit (<italic>rpl32</italic>), two encode DNA-directed RNA polymerase subunits (<italic>rpoB</italic> and <italic>rpoC2)</italic>, and two encode protein translocons on the inner chloroplast membrane (<italic>ycf1</italic> and <italic>ycf2</italic>) (<xref ref-type="bibr" rid="B4">Allen et&#xa0;al., 2011</xref>). The M2a x M1a and M8 x M8a contrasts, which are more rigorous in identification and identified four genes (<italic>ndhF</italic>, <italic>rpoC2</italic>, <italic>ycf1</italic>, and <italic>ycf2</italic>) under local positive selection (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S8</bold>
</xref>) (<xref ref-type="bibr" rid="B79">Yang and Swanson, 2002</xref>; <xref ref-type="bibr" rid="B66">Swanson et&#xa0;al., 2003</xref>). The <italic>ndhF</italic> gene encodes NADH dehydrogenase F and is present in most vascular plants. Positive selection of this gene is associated with adaptation to greater light incidence at high altitudes in <italic>Silene vulgaris</italic> (Caryophyllaceae) and salt stress in species of the genus <italic>Limonium</italic> (Plumbaginaceae), suggesting that these loci under positive selection may be related to adaptation in Sapindaceae (<xref ref-type="bibr" rid="B37">Kr&#xfc;ger et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B15">Darshetkar et&#xa0;al., 2021</xref>). The gene rpoC2 is a crucial gene for the transcription of photosynthesis genes, and mutations in these genes can confer the albino phenotype(<xref ref-type="bibr" rid="B54">Park et&#xa0;al., 2023</xref>). The <italic>ycf1</italic> and <italic>ycf2</italic> are essential plant genes for photosynthetic protein import and plant survival (<xref ref-type="bibr" rid="B35">Kikuchi et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B34">Kikuchi et&#xa0;al., 2018</xref>). Previous studies also showed local positive selection in the <italic>ycf1</italic> and <italic>ycf2</italic> genes, both in angiosperm and gimonosperm, related to adaptation to environmental changes (<xref ref-type="bibr" rid="B21">Fan et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B80">Zeb et&#xa0;al., 2019</xref>). In addition, previous studies without considering the phylogeny indicated positive selection of the ycf2 gene and may, in addition to having loci on positive selection, present clades with a more significant amount of non-synonymous mutations (<xref ref-type="bibr" rid="B60">Saina et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>).</p>
<p>Previous phylogenies reported for the genus <italic>Serjania</italic> using data from molecular markers (ITS and trnL intron) indicated the formation of a paraphyletic genus with the inclusion of species from the genera <italic>Balsas</italic>, <italic>Chimborazoa</italic> and <italic>Houssayanthus</italic> (<xref ref-type="bibr" rid="B3">Acevedo-Rodr&#xed;guez et&#xa0;al., 2017</xref>). Thus, using molecular information as support, <xref ref-type="bibr" rid="B3">Acevedo-Rodr&#xed;guez et&#xa0;al. (2017)</xref> suggest that the group has changed to include the genera <italic>Balsas</italic>, <italic>Chimborazoa</italic>, and <italic>Houssayanthus</italic> in <italic>Serjania</italic>, forming a monophyletic group. Speciation events within the genus have probably occurred during the Neogene, resulting in over 230 species distributed throughout the Neotropics. The high level of diversification may be related to the ability to disperse seeds by wind (<xref ref-type="bibr" rid="B49">Muellner-Riehl et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B3">Acevedo-Rodr&#xed;guez et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B8">Buerki et&#xa0;al., 2021</xref>) and the emergence of climbing species on lianas. South American Sapindaceae species, especially lianas, show a distribution across Antarctica that occurred during the Middle Eocene (about 44 million years ago) (<xref ref-type="bibr" rid="B8">Buerki et&#xa0;al., 2021</xref>) and diversified about 18.5-19 million years ago (<xref ref-type="bibr" rid="B28">Jud et&#xa0;al., 2021</xref>).</p>
<p>Investigation of nucleotide diversity among families and subfamilies allowed the identification of hotspots of genetic diversity, which can be used as molecular markers to resolve intraspecific relationships and as barcoding markers. In general, intergenic spaces show higher nucleotide diversity, while gene regions are more conserved in species, results like those found by the Percentage of variable characters in embryophytes (<xref ref-type="bibr" rid="B81">Zhang et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B21">Fan et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B80">Zeb et&#xa0;al., 2019</xref>). Our results indicate 10 and 11 nucleotide diversity hotspots for Sapindaceae and Sapindoideae; among these six hotspots (<italic>tRNA-Lys</italic> &#x2014; <italic>rps16</italic>, <italic>ndhC</italic> &#x2013; <italic>tRNA-Val</italic>, <italic>petA</italic> &#x2013; <italic>psbJ</italic>, <italic>ndhF</italic>, <italic>rpl32</italic> &#x2013; <italic>ccsA</italic>, and <italic>ycf1</italic>) are in common for both tribe and family (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6A, B</bold>
</xref>). Other studies evaluating nucleotide diversity also indicate the petA-psbJ, rpl32-cssA, ndhF, and ycf1 regions as highly diverse regions, so we strongly suggest using these regions as molecular markers of the group (<xref ref-type="bibr" rid="B82">Zhou et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B45">Ma et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>). Only the <italic>ndhF</italic> and <italic>ycf1</italic> genes showed high nucleotide diversity, genes in which local positive selection was also found (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6A, B</bold>
</xref>, and <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S8</bold>
</xref>), which have already been described and used as molecular markers capable of distinguishing angiosperm and gymnosperm species, with great potential for the family of this study (<xref ref-type="bibr" rid="B18">Dong et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B21">Fan et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B80">Zeb et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B5">Amar, 2020</xref>; <xref ref-type="bibr" rid="B57">Ram&#xed;rez-Barahona et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B17">Dong et&#xa0;al., 2021</xref>).</p>
<p>The availability of data from chloroplast genomes for the <italic>Serjania</italic> genus can help develop future molecular markers specific to this genus, which can be applied to the definition of interspecific relationships in the genus. However, a more significant number of genomes from phylogenetically close species is required. Although only one chloroplast genome of the genus <italic>Serjania</italic> has been described, the two gene regions have the potential as markers for phylogenetic studies. They can be used to clarify evolutionary issues of the genus. These include modifying vegetational habits associated with the diversification of the group in lianas and fruit shape (<xref ref-type="bibr" rid="B28">Jud et&#xa0;al., 2021</xref>). In addition, they have the potential to be used as markers and DNA barcodes in the molecular taxonomic identification of species, providing very useful tools in the certification of natural medicines, as is the case with species of the genus <italic>Serjania</italic>.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>Our study provides the first assembly and annotation of a chloroplast genome of a species from the tribe Paullinieae (Sapindaceae), <italic>Serjania erecta</italic>. Three factors are associated with variation in the number of genes in the chloroplast genomes of sapindaceae: (1) expansion events in the IR, (2) pseudogenization of the <italic>rps2</italic> gene, and (3) absence and duplication of genes of tRNAs. Protein-coding genes are highly conserved in the Sapindaceae family, and only the <italic>psaI</italic> gene is evolving under neutrality. We recommend six regions (<italic>tRNA-Lys &#x2014; rps16, ndhC &#x2013; tRNA-Val, petA &#x2013; psbJ, ndhF, rpl32 &#x2013; ccsA, and ycf1</italic>) with potential used as a marker for both Sapidaceae and Sapindoideae. The genes <italic>ycf1</italic> and <italic>ndhF</italic>, in addition to showing high nucleotide diversity, also show positive local selection. Our work provides evidence that the <italic>ycf1</italic> and <italic>ndhF</italic> genes may be the most suitable markers for phylogenetic studies of the subfamily Sapindoideae and may contribute to the resolution of taxonomic uncertainties in this group.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, SRX18977468, <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, NC_072944.1.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>LCJC: Data curation, Formal Analysis, Investigation, Methodology, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. MS: Formal Analysis, Methodology, Software, Writing &#x2013; review &amp; editing. LRC: Formal Analysis, Investigation, Software, Writing &#x2013; review &amp; editing. RD: Formal Analysis, Software, Visualization, Writing &#x2013; review &amp; editing. RB-F: Formal Analysis, Investigation, Writing &#x2013; review &amp; editing. CT: Formal Analysis, Writing &#x2013; review &amp; editing. CS-N: Data curation, Formal Analysis, Investigation, Resources, Writing &#x2013; review &amp; editing. BB: Investigation, Resources, Writing &#x2013; review &amp; editing. AS: Resources, Writing &#x2013; review &amp; editing. JD-f: Conceptualization, Supervision, Writing &#x2013; review &amp; editing. MT: Conceptualization, Funding acquisition, Project administration, Supervision, Writing &#x2013; review &amp; editing. RN: Conceptualization, Data curation, Project administration, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The authors declare financial support was received for the research, authorship, and/or publication of this article. This work was developed in the context of Instituto Nacional de Ci&#xea;ncia e Tecnologia em Ecologia, Evolu&#xe7;&#xe3;o e Conserva&#xe7;&#xe3;o da Biodiversidade (INCT &#x2013; EECBio), supported by Conselho Nacional de Desenvolvimento Cient&#xed;fico e Tecnol&#xf3;gico (CNPq &#x2013; process 465610/20145) and Funda&#xe7;&#xe3;o de Amparo &#xe0; Pesquisa do Estado de Goi&#xe1;s (FAPEG &#x2013; process 201810267000023). We are also thankful for the support from PPGS Coordena&#xe7;&#xe3;o de Aperfei&#xe7;oamento de Pessoal de N&#xed;vel Superior (CAPES)/FAPEG (#08/2014) and CNPq (MCTIC/CNPq #28/2018, 435477/2018-8). RN was supported by a PDCTR fellowship from FAPEG/CNPq (#202110267000863). RB-F was supported by a DTI fellowship from CNPq. A PNPD scholarship from CAPES supported CT. A productivity grant from CNPq has continuously supported MT, CS-N, and JD-f.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>Reserva Particular Patrim&#xf4;nio Natural (RPPN) Ecocerrado Brasil team, we are grateful for the work carried out to conserve Brazilian medicinal species.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2023.1258794/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2023.1258794/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.pdf" id="SM1" mimetype="application/pdf"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Acevedo-Rodriguez</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>1990</year>). <article-title>Distributional patterns in Brazilian serjania (Sapindaceae)</article-title>. <source>Acta Bot. Brasilica</source> <volume>4</volume>, <fpage>69</fpage>&#x2013;<lpage>82</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1590/s0102-33061990000100005</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Acevedo-Rodr&#xed;guez</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Welzen</surname> <given-names>P. C.</given-names>
</name>
<name>
<surname>Van, Adema</surname> <given-names>F.</given-names>
</name>
<name>
<surname>van der Ham</surname> <given-names>R. W. J. M.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Sapindaceae. Kubitzki, K. (eds) <italic>Flowering Plants. Eudicots. The Families and Genera of Vascular Plants</italic>
</article-title>. <volume>10</volume>, <page-range>357&#x2013;407</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-3-642-14397-7_17</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Acevedo-Rodr&#xed;guez</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Wurdack</surname> <given-names>K. J.</given-names>
</name>
<name>
<surname>Ferrucci</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>Johnson</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Dias</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Coelho</surname> <given-names>R. G.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Generic relationships and classification of tribe paullinieae (Sapindaceae) with a new concept of supertribe paulliniodae</article-title>. <source>Syst. Bot.</source> <volume>42</volume>, <fpage>96</fpage>&#x2013;<lpage>114</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1600/036364417X694926</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Allen</surname> <given-names>J. F.</given-names>
</name>
<name>
<surname>de Paula</surname> <given-names>W. B. M.</given-names>
</name>
<name>
<surname>Puthiyaveetil</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Nield</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>A structural phylogenetic map for chloroplast photosynthesis</article-title>. <source>Trends Plant Sci.</source> <volume>16</volume>, <fpage>645</fpage>&#x2013;<lpage>655</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tplants.2011.10.004</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Amar</surname> <given-names>M. H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>ycf1-ndhF genes, the most promising plastid genomic barcode, sheds light on phylogeny at low taxonomic levels in Prunus persica</article-title>. <source>J. Genet. Eng. Biotechnol.</source> <volume>18</volume>, <page-range>1&#x2013;10</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s43141-020-00057-3</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bausher</surname> <given-names>M. G.</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>N. D.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>S. B.</given-names>
</name>
<name>
<surname>Jansen</surname> <given-names>R. K.</given-names>
</name>
<name>
<surname>Daniell</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>The complete chloroplast genome sequence of Citrus sinensis (L.) Osbeck var &#x201c;Ridge Pineapple&#x201d;: Organization and phylogenetic relationships to other angiosperms</article-title>. <source>BMC Plant Biol.</source> <volume>6</volume>, <page-range>1&#x2013;12</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2229-6-21</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beier</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Thiel</surname> <given-names>T.</given-names>
</name>
<name>
<surname>M&#xfc;nch</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Scholz</surname> <given-names>U.</given-names>
</name>
<name>
<surname>Mascher</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>MISA-web: A web server for microsatellite prediction</article-title>. <source>Bioinformatics</source> <volume>33</volume>, <fpage>2583</fpage>&#x2013;<lpage>2585</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btx198</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buerki</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Callmander</surname> <given-names>M. W.</given-names>
</name>
<name>
<surname>Acevedo-Rodriguez</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Lowry</surname> <given-names>P. P.</given-names>
</name>
<name>
<surname>Munzinger</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Bailey</surname> <given-names>P.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>An updated infra-familial classification of Sapindaceae based on targeted enrichment data</article-title>. <source>Am. J. Bot.</source> <volume>108</volume>, <fpage>1234</fpage>&#x2013;<lpage>1251</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/ajb2.1693</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buerki</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Forest</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Acevedo-Rodr&#xed;guez</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Callmander</surname> <given-names>M. W.</given-names>
</name>
<name>
<surname>Nylander</surname> <given-names>J. A. A.</given-names>
</name>
<name>
<surname>Harrington</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2009</year>). <article-title>Plastid and nuclear DNA markers reveal intricate relationships at subfamilial and tribal levels in the soapberry family (Sapindaceae)</article-title>. <source>Mol. Phylogenet. Evol.</source> <volume>51</volume>, <fpage>238</fpage>&#x2013;<lpage>258</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ympev.2009.01.012</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buerki</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lowry</surname> <given-names>P. P.</given-names>
</name>
<name>
<surname>Alvarez</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Razafimandimbison</surname> <given-names>S. G.</given-names>
</name>
<name>
<surname>K&#xfc;pfer</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Callmander</surname> <given-names>M. W.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Phylogeny and circumscription of Sapindaceae revisited: Molecular sequence data, morphology and biogeography support recognition of a new family, Xanthoceraceae</article-title>. <source>Plant Ecol. Evol.</source> <volume>143</volume>, <fpage>148</fpage>&#x2013;<lpage>159</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5091/plecevo.2010.437</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<collab>CBOL Plant Working Group</collab>
</person-group> (<year>2009</year>). <article-title>A DNA barcode for land plants</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>106</volume>, <fpage>12794</fpage>&#x2013;<lpage>12797</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0905845106</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chase</surname> <given-names>M. W.</given-names>
</name>
<name>
<surname>Christenhusz</surname> <given-names>M. J. M.</given-names>
</name>
<name>
<surname>Fay</surname> <given-names>M. F.</given-names>
</name>
<name>
<surname>Byng</surname> <given-names>J. W.</given-names>
</name>
<name>
<surname>Judd</surname> <given-names>W. S.</given-names>
</name>
<name>
<surname>Soltis</surname> <given-names>D. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>An update of the Angiosperm Phylogeny Group classification for the orders and families of flowering plants: APG IV</article-title>. <source>Botanical J. Linn. Soc.</source> <volume>181</volume>, <fpage>1</fpage>&#x2013;<lpage>20</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/boj.12385</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The complete chloroplast genome sequence of Acer cinnamomifolium (Aceraceae), a plant species endemic to China</article-title>. <source>Mitochondrial DNA B Resour.</source> <volume>4</volume>, <fpage>3450</fpage>&#x2013;<lpage>3451</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/23802359.2019.1674211</pub-id>
</citation>
</ref>
<ref id="B501">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Christopher</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>Cushman</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Price</surname> <given-names>C. A.</given-names>
</name>
<name>
<surname>Hallick</surname> <given-names>R. B.</given-names>
</name>
</person-group> (<year>1988</year>). <article-title>Organization of ribosomal protein genes rp123, rpl2, rpsl9, rpl22 and rps3 on the Euglena gracilis chloroplast genome</article-title>. <source>Curr. Genet.</source> <volume>14</volume>, <fpage>275</fpage>&#x2013;<lpage>285</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF00376748</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Darling</surname> <given-names>A. C. E.</given-names>
</name>
<name>
<surname>Mau</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Blattner</surname> <given-names>F. R.</given-names>
</name>
<name>
<surname>Perna</surname> <given-names>N. T.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Mauve: Multiple alignment of conserved genomic sequence with rearrangements</article-title>. <source>Genome Res.</source> <volume>14</volume>, <fpage>1394</fpage>&#x2013;<lpage>1403</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.2289704</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Darshetkar</surname> <given-names>A. M.</given-names>
</name>
<name>
<surname>Maurya</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Bazarragchaa</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Batdelger</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Janchiv</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Plastome analysis unveils Inverted Repeat (IR) expansion and positive selection in Sea Lavenders (Limonium, Plumbaginaceae, Limonioideae, Limonieae)</article-title>. <source>PhytoKeys</source> <volume>175</volume>, <fpage>89</fpage>&#x2013;<lpage>107</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3897/phytokeys.175.61054</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dierckxsens</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Mardulyn</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Smits</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>NOVOPlasty: <italic>De novo</italic> assembly of organelle genomes from whole genome data</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume>, <page-range>1&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkw955</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Ming</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Chloroplast genome of rambutan and comparative analyses in sapindaceae</article-title>. <source>Plants</source> <volume>10</volume>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/plants10020283</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zuo</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>ycf1, the most promising plastid DNA barcode of land plants</article-title>. <source>Sci. Rep.</source> <volume>5</volume>
<elocation-id>8348</elocation-id>, <page-range>1&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/srep08348</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Doyle</surname> <given-names>J. J.</given-names>
</name>
<name>
<surname>Doyle</surname> <given-names>J. L.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>A rapid DNA isolation procedure for small quantities of fresh leaf tissue</article-title>. <source>Phytochem. Bull.</source> <volume>19</volume>, <fpage>11</fpage>&#x2013;<lpage>15</lpage>.</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dugas</surname> <given-names>D. V.</given-names>
</name>
<name>
<surname>Hernandez</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Koenen</surname> <given-names>E. J. M.</given-names>
</name>
<name>
<surname>Schwarz</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Straub</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hughes</surname> <given-names>C. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Mimosoid legume plastome evolution: IR expansion, tandem repeat expansions, and accelerated rate of evolution in clpP</article-title>. <source>Sci. Rep.</source> <volume>5</volume>, <page-range>1&#x2013;13</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/srep16958</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fan</surname> <given-names>W. B.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Shahzad</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z. H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Comparative chloroplast genomics of dipsacales species: Insights into sequence variation, adaptive evolution, and phylogenetic relationships</article-title>. <source>Front. Plant Sci.</source> <volume>9</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2018.00689</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ferrucci</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>Acevedo-Rodr&#xed;guez</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Three new species of Serjania (Sapindaceae) from south America</article-title>. <source>Syst. Bot.</source> <volume>30</volume>, <fpage>153</fpage>&#x2013;<lpage>162</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1600/0363644053661904</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gantt</surname> <given-names>J. S.</given-names>
</name>
<name>
<surname>Baldauf</surname> <given-names>S. L.</given-names>
</name>
<name>
<surname>Calie</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>Weeden</surname> <given-names>N. F.</given-names>
</name>
<name>
<surname>Palmer</surname> <given-names>J. D.</given-names>
</name>
</person-group> (<year>1991</year>). <article-title>Transfer of rpl22 to the nucleus greatly preceded its loss from the chloroplast and involved the gain of an intron</article-title>. <source>EMBO J.</source> <volume>10</volume>, <fpage>3073</fpage>&#x2013;<lpage>3078</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/j.1460-2075.1991.tb07859.x</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gomig</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Pietrovski</surname> <given-names>E. F.</given-names>
</name>
<name>
<surname>Guedes</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Dalmarco</surname> <given-names>E. M.</given-names>
</name>
<name>
<surname>Calderari</surname> <given-names>M. T.</given-names>
</name>
<name>
<surname>Guimar&#xe3;es</surname> <given-names>C. L.</given-names>
</name>
<etal/>
</person-group>. (<year>2008</year>). <article-title>Topical anti-inflammatory activity of Serjania erecta Radlk (Sapindaceae) extracts</article-title>. <source>J. Ethnopharmacol.</source> <volume>118</volume>, <fpage>220</fpage>&#x2013;<lpage>224</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jep.2008.03.017</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hildebrand</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hallick</surname> <given-names>R. B.</given-names>
</name>
<name>
<surname>Passavant</surname> <given-names>C. W.</given-names>
</name>
<name>
<surname>Bourque</surname> <given-names>D. P.</given-names>
</name>
</person-group> (<year>1988</year>). <article-title>Trans-splicing in chloroplasts: The rpsl2 loci of Nicotiana tabacum</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>85</volume>, <page-range>372&#x2013;376</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.85.2.372</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hiruma-Lima</surname> <given-names>C. A.</given-names>
</name>
<name>
<surname>Castelo</surname> <given-names>A. P. C.</given-names>
</name>
<name>
<surname>Arruda</surname> <given-names>B. N.</given-names>
</name>
<name>
<surname>Coelho</surname> <given-names>R. G.</given-names>
</name>
<name>
<surname>Honda</surname> <given-names>N. K.</given-names>
</name>
<name>
<surname>Ferrazoli</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2009</year>). <article-title>Gastroprotective effect of Serjania erecta Radlk (Sapindaceae): Involvement of sensory neurons, endogenous nonprotein sulfhydryls, and nitric oxide</article-title>. <source>J. Med. Food</source> <volume>12</volume>, <fpage>1411</fpage>&#x2013;<lpage>1415</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1089/jmf.2008.0269</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jansen</surname> <given-names>R. K.</given-names>
</name>
<name>
<surname>Ruhlman</surname> <given-names>T. A.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Plastid genomes of seed plants</article-title>. <source>Genomics of Chloroplasts and Mitochondria, Advances in Photosynthesis and Respiration</source>. <volume>35</volume>, <page-range>103&#x2013;126</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-94-007-2920-9_5</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jud</surname> <given-names>N. A.</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>S. E.</given-names>
</name>
<name>
<surname>Nelson</surname> <given-names>C. W.</given-names>
</name>
<name>
<surname>Bastos</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Chery</surname> <given-names>J. G.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Climbing since the early Miocene: The fossil record of Paullinieae (Sapindaceae)</article-title>. <source>PloS One</source> <volume>16</volume>, <page-range>1&#x2013;22</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0248369</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kalyaanamoorthy</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Minh</surname> <given-names>B. Q.</given-names>
</name>
<name>
<surname>Wong</surname> <given-names>T. K. F.</given-names>
</name>
<name>
<surname>Von Haeseler</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Jermiin</surname> <given-names>L. S.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>ModelFinder: Fast model selection for accurate phylogenetic estimates</article-title>. <source>Nat. Methods</source> <volume>14</volume>, <fpage>587</fpage>&#x2013;<lpage>589</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.4285</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kang</surname> <given-names>B. C.</given-names>
</name>
<name>
<surname>Bae</surname> <given-names>S. J.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>J. S.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Chloroplast and mitochondrial DNA editing in plants</article-title>. <source>Nat. Plants</source> <volume>7</volume>, <fpage>899</fpage>&#x2013;<lpage>905</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41477-021-00943-9</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Katoh</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Standley</surname> <given-names>D. M.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>MAFFT multiple sequence alignment software version 7: Improvements in performance and usability</article-title>. <source>Mol. Biol. Evol.</source> <volume>30</volume>, <fpage>772</fpage>&#x2013;<lpage>780</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/mst010</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kearse</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Moir</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Wilson</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Stones-Havas</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Cheung</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Sturrock</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Geneious Basic: An integrated and extendable desktop software platform for the organization and analysis of sequence data</article-title>. <source>Bioinformatics</source> <volume>28</volume>, <fpage>1647</fpage>&#x2013;<lpage>1649</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bts199</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kent</surname> <given-names>W. J.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>BLAT &#x2014;The BLAST -like alignment tool</article-title>. <source>Genome Res.</source> <volume>12</volume>, <fpage>656</fpage>&#x2013;<lpage>664</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.229202</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kikuchi</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Asakura</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Imai</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Nakahira</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Kotani</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Hashiguchi</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>A Ycf2-FtsHi heteromeric AAA-ATPase complex is required for chloroplast protein import</article-title>. <source>Plant Cell</source> <volume>30</volume>, <fpage>2677</fpage>&#x2013;<lpage>2703</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1105/tpc.18.00357</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kikuchi</surname> <given-names>S.</given-names>
</name>
<name>
<surname>B&#xe9;dard</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Hirano</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hirabayashi</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Oishi</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Imai</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2013</year>). <article-title>Uncovering the protein translocon at the chloroplast inner envelope membrane</article-title>. <source>Sci. (1979)</source> <volume>339</volume>, <fpage>571</fpage>&#x2013;<lpage>574</lpage>.</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>K&#xf6;hler</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Reginato</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Souza-Chies</surname> <given-names>T. T.</given-names>
</name>
<name>
<surname>Majure</surname> <given-names>L. C.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Insights into chloroplast genome evolution across opuntioideae (Cactaceae) reveals robust yet sometimes conflicting phylogenetic topologies</article-title>. <source>Front. Plant Sci.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2020.00729</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kr&#xfc;ger</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Abeyawardana</surname> <given-names>O. A. J.</given-names>
</name>
<name>
<surname>Ju&#x159;&#xed;&#x10d;ek</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kr&#xfc;ger</surname> <given-names>C.</given-names>
</name>
<name>
<surname>&#x160;torchov&#xe1;</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Variation in plastid genomes in the gynodioecious species Silene vulgaris</article-title>. <source>BMC Plant Biol.</source> <volume>19</volume>, <page-range>1&#x2013;15</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12870-019-2193-0</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Kurtz</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Choudhuri</surname> <given-names>J. V.</given-names>
</name>
<name>
<surname>Ohlebusch</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Schleiermacher</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Stoye</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Giegerich</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2001</year>). <source>REPuter: the manifold applications of repeat analysis on a genomic scale. Nucleic Acids Res.</source> <volume>29</volume>, <page-range>4633&#x2013;4642</page-range>. doi: <pub-id pub-id-type="doi">10.1093/nar/29.22.4633</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Laslett</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Canback</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>ARAGORN, a program to detect tRNA genes and tmRNA genes in nucleotide sequences</article-title>. <source>Nucleic Acids Res.</source> <volume>32</volume>, <fpage>11</fpage>&#x2013;<lpage>16</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkh152</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leebens-Mack</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Raubeson</surname> <given-names>L. A.</given-names>
</name>
<name>
<surname>Cui</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Kuehl</surname> <given-names>J. V.</given-names>
</name>
<name>
<surname>Fourcade</surname> <given-names>M. H.</given-names>
</name>
<name>
<surname>Chumley</surname> <given-names>T. W.</given-names>
</name>
<etal/>
</person-group>. (<year>2005</year>). <article-title>Identifying the basal angiosperm node in chloroplast genome phylogenies: Sampling one&#x2019;s way out of the Felsenstein zone</article-title>. <source>Mol. Biol. Evol.</source> <volume>22</volume>, <fpage>1948</fpage>&#x2013;<lpage>1963</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msi191</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Long</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>The complete chloroplast genome sequence of tung tree (Vernicia fordii): Organization and phylogenetic relationships with other angiosperms</article-title>. <source>Sci. Rep.</source> <volume>7</volume>, <page-range>1&#x2013;11</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-017-02076-6</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Lou</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>b). <article-title>Comparison of the complete plastomes and the phylogenetic analysis of Paulownia species</article-title>. <source>Sci. Rep.</source> <volume>10</volume>, <page-range>1&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-020-59204-y</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2020</year>a). <article-title>Initial characterization of the chloroplast genome of vicia sepium, an important wild resource plant, and related inferences about its evolution</article-title>. <source>Front. Genet.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fgene.2020.00073</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lohse</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Drechsel</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Kahlau</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Bock</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>OrganellarGenomeDRAW&#x2013;a suite of tools for generating physical maps of plastid and mitochondrial genomes and visualizing expression data sets</article-title>. <source>Nucleic Acids Res.</source> <volume>41</volume>, <page-range>W575&#x2013;W581</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkt289</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ma</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Bi</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Characterization of the complete chloroplast genome of acer truncatum bunge (Sapindales: Aceraceae): A new woody oil tree species producing nervonic acid</article-title>. <source>BioMed. Res. Int.</source> <volume>2019</volume>, <page-range>1&#x2013;13</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2019/7417239</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Margulis</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Bermudes</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>1985</year>). <article-title>Symbiosis as a mechanism of evolution: status of cell symbiosis theory</article-title>. <source>Symbiosis</source> <volume>1</volume>, <fpage>101</fpage>&#x2013;<lpage>124</lpage>.</citation>
</ref>
<ref id="B47">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Millen</surname> <given-names>R. S.</given-names>
</name>
<name>
<surname>Olmstead</surname> <given-names>R. G.</given-names>
</name>
<name>
<surname>Adams</surname> <given-names>K. L.</given-names>
</name>
<name>
<surname>Palmer</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Lao</surname> <given-names>N. T.</given-names>
</name>
<name>
<surname>Heggie</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2001</year>) <source>Many Parallel Losses of infA from Chloroplast DNA during Angiosperm Evolution with Multiple Independent Transfers to the Nucleus</source>. Available at: <uri xlink:href="http://www.plantcell.org">www.plantcell.org</uri>.</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moore</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Soltis</surname> <given-names>P. S.</given-names>
</name>
<name>
<surname>Bell</surname> <given-names>C. D.</given-names>
</name>
<name>
<surname>Burleigh</surname> <given-names>J. G.</given-names>
</name>
<name>
<surname>Soltis</surname> <given-names>D. E.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Phylogenetic analysis of 83 plastid genes further resolves the early diversification of eudicots</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>107</volume>, <fpage>4623</fpage>&#x2013;<lpage>4628</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0907801107</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muellner-Riehl</surname> <given-names>A. N.</given-names>
</name>
<name>
<surname>Weeks</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Clayton</surname> <given-names>J. W.</given-names>
</name>
<name>
<surname>Buerki</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Nauheimer</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Chiang</surname> <given-names>Y. C.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Molecular phylogenetics and molecular clock dating of Sapindales based on plastid rbcL, atpB and trnL-trnF DNA sequences</article-title>. <source>Taxon</source> <volume>65</volume>, <fpage>1019</fpage>&#x2013;<lpage>1036</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.12705/655.5</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Nei</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2000</year>). <source>Molecular evolution and phylogenetics</source> (<publisher-loc>New York, New York, USA</publisher-loc>: <publisher-name>Oxford University Press</publisher-name>).</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nguyen</surname> <given-names>L. T.</given-names>
</name>
<name>
<surname>Schmidt</surname> <given-names>H. A.</given-names>
</name>
<name>
<surname>Von Haeseler</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Minh</surname> <given-names>B. Q.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>IQ-TREE: A fast and effective stochastic algorithm for estimating maximum-likelihood phylogenies</article-title>. <source>Mol. Biol. Evol.</source> <volume>32</volume>, <fpage>268</fpage>&#x2013;<lpage>274</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msu300</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Novoa</surname> <given-names>E. M.</given-names>
</name>
<name>
<surname>Pavon-Eternod</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Ribas De Pouplana</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>A role for tRNA modifications in genome structure and codon usage</article-title>. <source>Cell</source> <volume>149</volume>, <fpage>202</fpage>&#x2013;<lpage>213</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cell.2012.01.050</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Okonechnikov</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Golosova</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Fursov</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Varlamov</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Vaskin</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Efremov</surname> <given-names>I.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Unipro UGENE: A unified bioinformatics toolkit</article-title>. <source>Bioinformatics</source> <volume>28</volume>, <fpage>1166</fpage>&#x2013;<lpage>1167</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bts091</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Park</surname> <given-names>H. S.</given-names>
</name>
<name>
<surname>Jeon</surname> <given-names>J. H.</given-names>
</name>
<name>
<surname>Cho</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Park</surname> <given-names>J. Y.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>). <article-title>High-throughput discovery of plastid genes causing albino phenotypes in ornamental chimeric plants</article-title>. <source>Hortic. Res.</source> <volume>10</volume>, <page-range>1&#x2013;11</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/hr/uhac246</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pl&#xf6;chinger</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Torabi</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Rantala</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Tikkanen</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Suorsa</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Jensen</surname> <given-names>P. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>The low molecular weight protein psai stabilizes the light-harvesting complex II docking site of photosystem I</article-title>. <source>Plant Physiol.</source> <volume>172</volume>, <fpage>450</fpage>&#x2013;<lpage>463</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1104/pp.16.00647</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ram&#xed;rez-Barahona</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Sauquet</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Magall&#xf3;n</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The delayed and geographically heterogeneous diversification of flowering plant families</article-title>. <source>Nat. Ecol. Evol.</source> <volume>4</volume>, <fpage>1232</fpage>&#x2013;<lpage>1238</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41559-020-1241-3</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="book">
<person-group person-group-type="author">
<collab>R Core Team</collab>
</person-group> (<year>2020</year>). <source>R: A language and environment for statistical computing</source> (<publisher-loc>Vienna, Austria</publisher-loc>: <publisher-name>R Foundation for Statistical Computing</publisher-name>).</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rodr&#xed;guez-Ezpeleta</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Brinkmann</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Burey</surname> <given-names>S. C.</given-names>
</name>
<name>
<surname>Roure</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Burger</surname> <given-names>G.</given-names>
</name>
<name>
<surname>L&#xf6;ffelhardt</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>2005</year>). <article-title>Monophyly of primary photosynthetic eukaryotes: Green plants, red algae, and glaucophytes</article-title>. <source>Curr. Biol.</source> <volume>15</volume>, <fpage>1325</fpage>&#x2013;<lpage>1330</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cub.2005.06.040</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rozas</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Ferrer-Mata</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Sanchez-DelBarrio</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Guirao-Rico</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Librado</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Ramos-Onsins</surname> <given-names>S. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>DnaSP 6: DNA sequence polymorphism analysis of large data sets</article-title>. <source>Mol. Biol. Evol.</source> <volume>34</volume>, <fpage>3299</fpage>&#x2013;<lpage>3302</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msx248</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saina</surname> <given-names>J. K.</given-names>
</name>
<name>
<surname>Gichira</surname> <given-names>A. W.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z. Z.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>G. W.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Q. F.</given-names>
</name>
<name>
<surname>Liao</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>The complete chloroplast genome sequence of Dodonaea viscosa: comparative and phylogenetic analyses</article-title>. <source>Genetica</source> <volume>146</volume>, <fpage>101</fpage>&#x2013;<lpage>113</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10709-017-0003-x</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sato</surname> <given-names>N.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Complex origins of chloroplast membranes with photosynthetic machineries: multiple transfers of genes from divergent organisms at different times or a single endosymbiotic event</article-title>? <source>J. Plant Res.</source> <volume>133</volume>, <fpage>15</fpage>&#x2013;<lpage>33</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10265-019-01157-z</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sch&#xf6;ttler</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Thiele</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Belkius</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Bergner</surname> <given-names>S. V.</given-names>
</name>
<name>
<surname>Fl&#xfc;gel</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wittenberg</surname> <given-names>G.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>The plastid-encoded PsaI subunit stabilizes photosystem i during leaf senescence in tobacco</article-title>. <source>J. Exp. Bot.</source> <volume>68</volume>, <fpage>1137</fpage>&#x2013;<lpage>1155</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/jxb/erx009</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sobreiro</surname> <given-names>M. B.</given-names>
</name>
<name>
<surname>Vieira</surname> <given-names>L. D.</given-names>
</name>
<name>
<surname>Nunes</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Novaes</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Coissac</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Silva-Junior</surname> <given-names>O. B.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Chloroplast genome assembly of Handroanthus impetiginosus: comparative analysis and molecular evolution in Bignoniaceae</article-title>. <source>Planta</source> <volume>252</volume>, <page-range>1&#x2013;16</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00425-020-03498-9</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Somner</surname> <given-names>G. V.</given-names>
</name>
<name>
<surname>Ferrucci</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>Acevedo-Rodr&#xed;guez</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Serjania in Lista de Esp&#xe9;cies da Flora do Brasil</article-title>. <source>Jardim Bot&#xe2;nico do Rio Janeiro.</source>  Available at: <uri xlink:href="https://floradobrasil.jbrj.gov.br/F">https://floradobrasil.jbrj.gov.br/F</uri> (Accessed March 19, 2023). </citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Souza</surname> <given-names>U. J. B. d.</given-names>
</name>
<name>
<surname>Nunes</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Targueta</surname> <given-names>C. P.</given-names>
</name>
<name>
<surname>Diniz-Filho</surname> <given-names>J. A. F.</given-names>
</name>
<name>
<surname>Telles</surname> <given-names>M. P. d. C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The complete chloroplast genome of Stryphnodendron adstringens (Leguminosae - Caesalpinioideae): comparative analysis with related Mimosoid species</article-title>. <source>Sci. Rep.</source> <volume>9</volume>, <page-range>1&#x2013;12</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-019-50620-3</pub-id>
</citation>
</ref>
<ref id="B500">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Steinmann</surname> <given-names>V. W.</given-names>
</name>
<name>
<surname>Ferrucci</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>Maya-Lastra</surname> <given-names>C. A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Phylogenetics of Serjania (Sapindaceae-Paullinieae), with emphasis on fruit evolution and the description of a new species from Michoac&#xe1;n, Mexico</article-title>. <source>Syst. Biodivers.</source> <volume>20</volume>, <fpage>1</fpage>&#x2013;<lpage>21</lpage>. doi: <pub-id pub-id-type="doi">10.1080/14772000.2022.2030425</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Swanson</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Nielsen</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Q.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Pervasive adaptive evolution in mammalian fertilization proteins</article-title>. <source>Mol. Biol. Evol.</source> <volume>20</volume>, <fpage>18</fpage>&#x2013;<lpage>20</lpage>. doi: <pub-id pub-id-type="doi">10.1093/oxfordjournals.molbev.a004233</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Talavera</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Castresana</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Improvement of phylogenies after removing divergent and ambiguously aligned blocks from protein sequence alignments</article-title>. <source>Syst. Biol.</source> <volume>56</volume>, <fpage>564</fpage>&#x2013;<lpage>577</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10635150701472164</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tillich</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Lehwark</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Pellizzer</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Ulbricht-Jones</surname> <given-names>E. S.</given-names>
</name>
<name>
<surname>Fischer</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Bock</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>GeSeq - Versatile and accurate annotation of organelle genomes</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume>, <fpage>W6</fpage>&#x2013;<lpage>W11</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkx391</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Urdampilleta</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Ferrucci</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>Vanzela</surname> <given-names>A. L. L.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Cytogenetic studies in South American species of Serjania (Sapindaceae: Paullinieae)</article-title>. <source>Plant Biosyst.</source> <volume>146</volume>, <fpage>835</fpage>&#x2013;<lpage>846</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/11263504.2012.705349</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vaidya</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Lohman</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Meier</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>SequenceMatrix: Concatenation software for the fast assembly of multi-gene datasets with character set and codon information</article-title>. <source>Cladistics</source> <volume>27</volume>, <fpage>171</fpage>&#x2013;<lpage>180</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1096-0031.2010.00329.x</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Varshney</surname> <given-names>R. K.</given-names>
</name>
<name>
<surname>Graner</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Sorrells</surname> <given-names>M. E.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Genic microsatellite markers in plants: Features and applications</article-title>. <source>Trends Biotechnol.</source> <volume>23</volume>, <fpage>48</fpage>&#x2013;<lpage>55</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tibtech.2004.11.005</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Whole-Genome comparison reveals divergent IR borders and mutation hotspots in chloroplast genomes of herbaceous bamboos (Bambusoideae: Olyreae)</article-title>. <source>Molecules</source> <volume>23</volume>, <page-range>1&#x2013;20</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/molecules23071537</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>Y. H.</given-names>
</name>
<name>
<surname>Qu</surname> <given-names>X. J.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>S. Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>D. Z.</given-names>
</name>
<name>
<surname>Yi</surname> <given-names>T. S.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Plastomes of Mimosoideae: structural and size variation, sequence divergence, and phylogenetic implication</article-title>. <source>Tree Genet. Genomes</source> <volume>13</volume>, <page-range>1&#x2013;18</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11295-017-1124-1</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wheeler</surname> <given-names>T. J.</given-names>
</name>
<name>
<surname>Eddy</surname> <given-names>S. R.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Nhmmer: DNA homology search with profile HMMs</article-title>. <source>Bioinformatics</source> <volume>29</volume>, <fpage>2487</fpage>&#x2013;<lpage>2489</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btt403</pub-id>
</citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wicke</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Schneeweiss</surname> <given-names>G. M.</given-names>
</name>
<name>
<surname>dePamphilis</surname> <given-names>C. W.</given-names>
</name>
<name>
<surname>M&#xfc;ller</surname> <given-names>K. F.</given-names>
</name>
<name>
<surname>Quandt</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The evolution of the plastid chromosome in land plants: Gene content, gene order, gene function</article-title>. <source>Plant Mol. Biol.</source> <volume>76</volume>, <fpage>273</fpage>&#x2013;<lpage>297</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11103-011-9762-4</pub-id>
</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>D. G.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>X. J.</given-names>
</name>
<name>
<surname>Pei</surname> <given-names>X. Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Comparative chloroplast genomics of Gossypium species: Insights into repeat sequence variations and phylogeny</article-title>. <source>Front. Plant Sci.</source> <volume>9</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2018.00376</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiao-Ming</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Junrui</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Sha</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Hongbo</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Lan</surname> <given-names>Q.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Inferring the evolutionary mechanism of the chloroplast genome size by comparing whole-chloroplast genome sequences in seed plants</article-title>. <source>Sci. Rep.</source> <volume>7</volume>, <page-range>1&#x2013;10</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-017-01518-5</pub-id>
</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>PAML 4: Phylogenetic analysis by maximum likelihood</article-title>. <source>Mol. Biol. Evol.</source> <volume>24</volume>, <fpage>1586</fpage>&#x2013;<lpage>1591</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msm088</pub-id>
</citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Swanson</surname> <given-names>W. J.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Codon-substitution models to detect adaptive evolution that account for heterogeneous selective pressures among site classes</article-title>. <source>Mol. Biol. Evol.</source> <volume>19</volume>, <fpage>49</fpage>&#x2013;<lpage>57</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/oxfordjournals.molbev.a003981</pub-id>
</citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zeb</surname> <given-names>U.</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>W.-L.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>T.-T.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>R.-N.</given-names>
</name>
<name>
<surname>Shahzad</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>X.-F.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Comparative plastid genomics of Pinus species: Insights into sequence variations and phylogenetic relationships</article-title>. <source>JSE J. Syst. Evol.</source> <volume>00</volume>, <page-range>1&#x2013;15</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/jse.12492</pub-id>
</citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Y. J.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>P. F.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>D. Z.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>High-throughput sequencing of six bamboo chloroplast genomes: Phylogenetic implications for temperate woody bamboos (Poaceae: Bambusoideae)</article-title>. <source>PloS One</source> <volume>6</volume>, <page-range>1&#x2013;16</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0020596</pub-id>
</citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Bai</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Comparative transcriptome and chloroplast genome analyses of two related dipteronia species</article-title>. <source>Front. Plant Sci.</source> <volume>7</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2016.01512</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>