<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2024.1394244</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Analysis of phylogenetic relationships in <italic>Macadamia</italic> shows evidence of extensive reticulate evolution</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Manatunga</surname>
<given-names>Sachini Lakmini</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Furtado</surname>
<given-names>Agnelo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/289599"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Topp</surname>
<given-names>Bruce</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1597601"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Alam</surname>
<given-names>Mobashwer</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/743911"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mason</surname>
<given-names>Patrick J.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kharabian-Masouleh</surname>
<given-names>Ardashir</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Henry</surname>
<given-names>Robert J.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/103236"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Queensland Alliance for Agriculture &amp; Food Innovation (QAAFI), University of Queensland</institution>, <addr-line>St Lucia, QLD</addr-line>, <country>Australia</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>ARC Centre of Excellence for Plant Success in Nature and Agriculture, The University of Queensland</institution>, <addr-line>St Luci, QLD</addr-line>, <country>Australia</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Queensland Alliance for Agriculture &amp; Food Innovation (QAAFI), Maroochy Research Facility, The University of Queensland</institution>, <addr-line>Nambour, QLD</addr-line>, <country>Australia</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Yu-Chung Chiang, National Sun Yat-sen University, Taiwan</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Carlos A. Machado, University of Maryland, College Park, United States</p>
<p>Isabel Marques, Universidade de Lisboa, Portugal</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Robert J. Henry, <email xlink:href="mailto:robert.henry@uq.edu.au">robert.henry@uq.edu.au</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>15</day>
<month>10</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1394244</elocation-id>
<history>
<date date-type="received">
<day>01</day>
<month>03</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>02</day>
<month>09</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Manatunga, Furtado, Topp, Alam, Mason, Kharabian-Masouleh and Henry</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Manatunga, Furtado, Topp, Alam, Mason, Kharabian-Masouleh and Henry</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The genus <italic>Macadamia</italic> in the Proteaceae family includes four species native to Australia. Two of the four species, <italic>M. integrifolia</italic> and <italic>M. tetraphylla</italic>, have recently been utilized to generate domesticated macadamia varieties, grown for their edible nuts. To explore diversity in macadamia genetic resources, a total of 166 wild genotypes, representing all four species, were sequenced. The four species were clearly distinguished as four separate clades in a phylogenetic analysis of the nuclear genome (based upon concatenated nuclear gene CDS and SNPs). The two larger species (<italic>M. integrifolia</italic> and <italic>M. tetraphylla</italic>) formed a clade, that had diverged from a clade including the smaller species (<italic>M. ternifolia</italic> and <italic>M. jansenii</italic>). The greatest diversity in nuclear and chloroplast genomes was found in the more widely distributed <italic>M. integrifolia</italic> while the rare <italic>M. jansenii</italic> showed little diversity. The chloroplast phylogeny revealed a much more complex evolutionary history. Multiple chloroplast capture events have resulted in chloroplast genome clades, including genotypes from different species. This suggests extensive reticulate evolution in <italic>Macadamia</italic> despite the emergence of the four distinct species that are supported by the analysis of their nuclear genomes. The chloroplast genomes showed strong associations with geographical distribution reflecting limited maternal gene movement in these species that have large seeds. The nuclear genomes showed lesser geographical differences, probably reflecting the longer distance pollen movement. This improved understanding of the distribution of diversity in <italic>Macadamia</italic> will aid in the conservation of these rare species now found in highly fragmented rainforest remnants.</p>
</abstract>
<kwd-group>
<kwd>
<italic>Macadamia</italic>
</kwd>
<kwd>phylogenetic</kwd>
<kwd>wild</kwd>
<kwd>chloroplast</kwd>
<kwd>nuclear genes</kwd>
<kwd>chloroplast capture</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="52"/>
<page-count count="12"/>
<word-count count="6910"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Plant Systematics and Evolution</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Phylogenetics, the study of evolutionary relationships among organisms, has become a powerful tool in a variety of biological disciplines (<xref ref-type="bibr" rid="B21">Liu et&#xa0;al., 2022</xref>). Over the last few decades, substantial effort has been made to understand the phylogenetic associations among angiosperms through the application of DNA sequence data (<xref ref-type="bibr" rid="B12">Jansen et&#xa0;al., 2006</xref>). Next-generation sequencing (NGS) has brought a transformation in sequence analysis by making it more affordable and increasing access to complete chloroplast and nuclear genome data (<xref ref-type="bibr" rid="B52">Zhou et&#xa0;al., 2021</xref>). There has been an emphasis by breeders to exploit wild germplasm, but a significant portion remains underutilized (<xref ref-type="bibr" rid="B51">Zhang and Batley, 2020</xref>). The lack of genomic data on wild germplasm is one barrier to its effective use in plant breeding efforts, and as a result, the integration of genes from wild germplasm into cultivated varieties has been limited. Recent advancements in genomics and bioinformatics have provided opportunities to unlock the hidden potential within wild germplasm (<xref ref-type="bibr" rid="B42">Tanksley, 1997</xref>) by extending this technology to less-studied plant species. This has opened new avenues to incorporate materials from wild germplasm (<xref ref-type="bibr" rid="B51">Zhang and Batley, 2020</xref>).</p>
<p>Macadamia is an evergreen perennial rainforest tree of the family Proteaceae and is indigenous to Australia (<xref ref-type="bibr" rid="B10">Hardner et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B45">Walton, 2011</xref>; <xref ref-type="bibr" rid="B34">O&#x2019;Connor et&#xa0;al., 2019</xref>). The genus <italic>Macadamia</italic> is the only angiosperm that has been domesticated as a large-scale commercial food crop in Australia (<xref ref-type="bibr" rid="B5">Aradhya et&#xa0;al., 1998</xref>). In accordance with the present classification of Proteaceae (<xref ref-type="bibr" rid="B25">Mast et&#xa0;al., 2008</xref>), the genus <italic>Macadamia</italic> has been classified into four species, namely, <italic>M. integrifolia</italic> (Maiden &amp; Betche), <italic>M. tetraphylla</italic> (L.A.S. Johnson), <italic>M. ternifolia</italic> (F. Muell), and <italic>M. jansenii</italic> (C.L. Gross &amp; P.H. Weston), using molecular and morphological data, while many species previously classified as <italic>Macadamia</italic> have been transferred to other genera. Among the four species, <italic>M. integrifolia</italic> has the widest natural distribution, extending from southeast Queensland to the New South Wales border. Two overlapping distributions lead to natural hybridization between <italic>M. integrifolia</italic> and <italic>M. tetraphylla</italic> and between <italic>M. integrifolia</italic> and <italic>M. ternifolia</italic> (<xref ref-type="bibr" rid="B34">O&#x2019;Connor et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B44">Topp et&#xa0;al., 2019</xref>). <italic>M. tetraphylla</italic> is mostly distributed in New South Wales, while <italic>M. ternifolia</italic> is distributed north of Brisbane, extending from the Samford Valley to Gympie (<xref ref-type="bibr" rid="B44">Topp et&#xa0;al., 2019</xref>). <italic>M. jansenii</italic> is the most geographically isolated species and is found only in Bulburin National Park north of Bundaberg, 180&#xa0;km from the closest <italic>M. integrifolia</italic> population (<xref ref-type="bibr" rid="B44">Topp et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B24">Mai et&#xa0;al., 2020</xref>). The genus <italic>Macadamia</italic> displays diversity in several morphological characteristics. These include the number of leaves per whorl, mature leaf size and shape, color of new leaves, presence of petiole, leaf margin serration, and differences in floral and fruit morphology (<xref ref-type="bibr" rid="B35">Peace, 2005</xref>). These characteristics are used for differentiating <italic>Macadamia</italic> species. However, some of these characteristics, such as leaf serration, can overlap across species and can be observed only at a certain stage (i.e., juvenile or adult) of the life cycle of some species. On the other hand, traits like nut and leaf size can vary within species depending on the environment and may not always be useful in distinguishing between the species (<xref ref-type="bibr" rid="B35">Peace, 2005</xref>; <xref ref-type="bibr" rid="B10">Hardner et&#xa0;al., 2009</xref>). Genomic information on the representative accessions of these four species can be instrumental in understanding the diversity and species distribution of <italic>Macadamia.</italic>
</p>
<p>Although genomic investigation in macadamia commenced a decade ago, only a few studies have been conducted to date. Several types of polymorphic molecular markers have been used to assess the genetic diversity in <italic>Macadamia</italic> (<xref ref-type="bibr" rid="B35">Peace, 2005</xref>; <xref ref-type="bibr" rid="B25">Mast et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B2">Ahmad Termizi et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B3">Alam et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B34">O&#x2019;Connor et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B24">Mai et&#xa0;al., 2020</xref>). However, few studies have been employed to characterize the genetic makeup of wild germplasm (<xref ref-type="bibr" rid="B24">Mai et&#xa0;al., 2020</xref>). In 2005, Peace et&#xa0;al. studied a large number of wild germplasm accessions using low-throughput RAF (randomly amplified DNA fingerprinting) and RAMiFi (randomly amplified microsatellite fingerprinting) markers (<xref ref-type="bibr" rid="B35">Peace, 2005</xref>). Another study by <xref ref-type="bibr" rid="B25">Mast et&#xa0;al. (2008)</xref> investigated the relationships between the four <italic>Macadamia</italic> species and their closely related wild relatives. They examined chloroplast DNA regions, such as matK, atpB, and ndhF and nuclear DNA genomic regions, such as waxy loci 1 and 2 and PHYA. By analyzing these markers, their aim was to gain insights into the complex relationships within the <italic>Macadamia</italic> genus and its wild relatives (<xref ref-type="bibr" rid="B25">Mast et&#xa0;al., 2008</xref>). However, these markers gave low genome coverage and provided poor marker density (<xref ref-type="bibr" rid="B3">Alam et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B31">Nock et&#xa0;al., 2020</xref>). <xref ref-type="bibr" rid="B2">Ahmad Termizi et&#xa0;al. (2016)</xref> analyzed individuals from wild <italic>M. integrifolia</italic> population using 516 single-nucleotide polymorphisms (SNPs) and reported the unique chlorotypes for each of the 12 samples (<xref ref-type="bibr" rid="B2">Ahmad Termizi et&#xa0;al., 2016</xref>). Furthermore, a recent study (<xref ref-type="bibr" rid="B24">Mai et&#xa0;al., 2020</xref>) examined the genetic relationships among 302 wild germplasm accessions using 2,872 SNPs and 8,415 <italic>in silico</italic> DArT markers and identified the species status of 94 unknown wild accessions. Although these studies examined the phylogenetic relationships among wild macadamia accessions, no previous study has resolved the phylogeny of the four <italic>Macadamia</italic> species.</p>
<p>In <italic>Macadamia</italic>, as in other plants, uniparentally inherited chloroplast DNA has been used to infer the phylogenetic patterns. However, many studies have documented the occurrence of reticulate evolution of chloroplast in other plant species (<xref ref-type="bibr" rid="B28">Nge et&#xa0;al., 2021</xref>). The phenomenon of reticulate evolution may result in the replacement of chloroplast genomes of one species with another (<xref ref-type="bibr" rid="B15">Kawabe et&#xa0;al., 2018</xref>) due to hybridization events. In many plants, reticulate evolution has caused a discordance between the molecular data derived from the chloroplast and the nuclear genome (<xref ref-type="bibr" rid="B28">Nge et&#xa0;al., 2021</xref>), resulting in conflicting topologies for phylogenetic trees (<xref ref-type="bibr" rid="B36">Rieseberg and Soltis, 1991</xref>). Therefore, reticulate evolution can have an impact on phylogenetic analyses that rely only on the chloroplast genomes or their genes (<xref ref-type="bibr" rid="B15">Kawabe et&#xa0;al., 2018</xref>). However, studies to date have not explored phylogenetic relationships in <italic>Macadamia</italic> based on both nuclear and complete chloroplast genomes.</p>
<p>Here, we focused on uncovering the diversity and relationships in wild <italic>Macadamia</italic> populations by using both chloroplast genomes and nuclear gene coding sequences (CDS). This is the first whole-genome sequencing data report for a large <italic>Macadamia</italic> population. To support improved conservation and utilization of the wild genetic resources, we sequenced whole chloroplast and nuclear genomes to better understand diversity within and relationships between species and populations of <italic>Macadamia</italic> in Australia.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Plant materials, DNA extraction, and sequencing</title>
<p>A total of 166 wild macadamia accessions representing all four species [<italic>M. integrifolia</italic> (<italic>n</italic> = 49), <italic>M. tetraphylla</italic> (<italic>n</italic> = 56), <italic>M. ternifolia</italic> (<italic>n</italic> = 23), and <italic>M. jansenii</italic> (<italic>n</italic> = 23)] and one related rainforest species from the Proteaceae, <italic>Lasjia whelanii</italic>, were selected for sequencing. Within the macadamia populations, 161 wild accessions, which were collected previously from multiple locations across the natural distribution of the four species, were grown and maintained at Nambour arboretum and <italic>ex situ</italic> germplasm centers at Nambour and Tiaro in Queensland and Alstonville in NSW (<xref ref-type="bibr" rid="B9">Hardner et&#xa0;al., 2004</xref>) and five from a private collection at Limpinwood, NSW (<xref ref-type="supplementary-material" rid="ST1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>) in Australia. Fully expanded young macadamia leaves, of accession within these <italic>ex situ</italic> collection sites, were collected in perforated labeled cellophane bags and immediately placed under dry ice until stored in a &#x2212;80&#xb0;C freezer at The University of Queensland, Brisbane, Australia.</p>
<p>Frozen leaves were coarse pulverized under liquid nitrogen using a mortar and pestle and further fine pulverized under cryogenic conditions using a Qiagen tissue lyser (MM400, Retsch, Germany). A modified version of the cetyltrimethylammonium bromide (CTAB) DNA extraction protocol described by <xref ref-type="bibr" rid="B8">Furtado (2014)</xref> was used to extract genomic DNA. The quality and quantity of the DNA samples were evaluated using a Nanodrop spectrophotometer (Nanodrop Technologies, Wilmington, DE, USA) by recording the absorbance ratios at 260/280 and 260/230 followed by running a 0.7% agarose gel with SYBR safe staining (Thermo Fisher Scientific). Whole-genome short-read sequencing was undertaken by BGI Hong Kong. A PCR-free library was generated and sequencing at 150-bp paired-end reads was undertaken on the DNBSEQ-G400 sequencing platform from MGI (MGI Tech Co., Ltd, Shenzhen, China) at an expected data yield/sample of at least 25&#xd7; genome size (800 Mb genome)</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Chloroplast genome assembly and annotation</title>
<p>All sequence data were analyzed in CLC Genomics Workbench 23.0.05 (CLC-GWB, CLC-Bio, QIAGEN, Denmark, <ext-link ext-link-type="uri" xlink:href="http://www.clcbio.com">http://www.clcbio.com</ext-link>) using the short-read pipeline. Quality control (QC) was performed for all short-read data. Reads were trimmed using a quality score limit of 0.01 with default parameters (more than 98% of the resulted trimmed reads had a Phred score &gt;25). A subset of quality trimmed short reads (2&#x2013;13 GB) was used for chloroplast genome assembly. All chloroplast genomes were assembled using the GetOrganelle toolkit (<xref ref-type="bibr" rid="B14">Jin et&#xa0;al., 2020</xref>) exploiting SPAdes v.3.15.3, Bowtie2 v.2.4.5, and Blast v.2.11.0 as dependencies. The correct configuration of the chloroplast genome was selected with respect to the <italic>M. integrifolia</italic> (sequence: NC_025288.1) (<xref ref-type="bibr" rid="B30">Nock et&#xa0;al., 2014</xref>) available at the National Center for Biotechnology Information (NCBI) (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/">http://www.ncbi.nlm.nih.gov/</ext-link>) using clone manager software (Sci Ed, USA).</p>
<p>The chloroplast genomes were annotated using the GeSeq online tool (<ext-link ext-link-type="uri" xlink:href="https://chlorobox.mpimp-golm.mpg.de/geseq.html">https://chlorobox.mpimp-golm.mpg.de/geseq.html</ext-link>) with <italic>M. integrifolia</italic> (sequence: NC_025288.1) as the genome (<xref ref-type="bibr" rid="B43">Tillich et&#xa0;al., 2017</xref>). Chloroplast genomes were annotated with the following settings: Annotation options: Annotate plastid inverted repeat (IR), Annotated plastid trans spliced rps12, Annotation support: Support annotation by Chloe, Annotation revision: Keep best annotation only, BLAT search&#x2013;protein search identity: 25, rRNA, tRNA, and DNA search identity: 85, HMMER profile: CDS+rRNA, ARAGORN v1.2.38- Genetic code: Bacterial/plant chloroplast, Max intron length: 3,000, tRNAscan-se v2.0.7- sequence source: organellar tRNAs, MPI-MP reference set: chloroplast land plants (CDS + rRNA) and Chloe v0.1.0- annotate- CDS + tRNA + rRNA. All genomes were imported to Geneious 2023.2.1 software (Biomatters Ltd, USA) to determine the number of genes, CDS, transfer RNAs (tRNAs), and ribosomal RNAs (rRNAs) in each sample.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Concatenated nuclear gene CDS sequences</title>
<p>Previously published annotated sequences of the nuclear genome of <italic>M. integrifolia</italic> (<xref ref-type="bibr" rid="B31">Nock et&#xa0;al., 2020</xref>) were selected as reference sequences to generate accession-specific consensus CDS of nuclear genes. CDS of <italic>M. integrifolia</italic> (GCF 013358625.1) were downloaded and imported to CLC-GWB to generate a local Blast database. The CDS of 106 <italic>Arabidopsis thaliana</italic> single-copy genes identified by <xref ref-type="bibr" rid="B19">Li et&#xa0;al. (2017)</xref> was subjected to tblastn against the <italic>M. integrifolia</italic> CDS database. We selected 56 tblastn hits with a single <italic>M. integrifolia</italic> CDS matching an <italic>A. thaliana</italic> CDS as these hits represented single-copy genes in the <italic>M. integrifolia</italic> genome. From these selected single hits, corresponding <italic>M. integrifolia</italic> CDS sequences were extracted and used as a reference to extract consensus sequences from each of the macadamia accessions and from <italic>L. whelanii</italic>. BLAST analysis using the 56 extracted <italic>M. integrifolia</italic> CDS and the CDS sequences of <italic>L. whelanii</italic> as a database resulted in the selection of 53 <italic>L. whelanii</italic> CDS as single hits that represented single-copy genes in <italic>L. whelanii</italic>. Corresponding (same as selected) 53 CDS sequences from <italic>M. integrifolia</italic> and from <italic>L. whelanii</italic> were selected for further analysis. The 53 CDS from <italic>M. integrifolia</italic> (<xref ref-type="supplementary-material" rid="ST2">
<bold>Supplementary Table&#xa0;2</bold>
</xref>) were used as reference sequences in the read mapping approach to generate corresponding CDS consensus sequences for each of the macadamia accessions. Essentially, short reads trimmed data of each macadamia accession were mapped separately to each of the 53 selected <italic>M. integrifolia</italic> CDS sequences to extract consensus sequences. Finally, consensus CDS sequences, were extracted for each macadamia accession, and were concatenated in the same sequential order to obtain the final nuclear gene CDS sequence.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Phylogenetic evaluation</title>
<p>Phylogenetic evaluation of macadamia was conducted by utilizing complete chloroplast genome sequences and single-copy concatenated nuclear gene CDS sequences. For phylogenetic analysis, we selected 138 wild macadamia accessions representing all four species. To maintain precision and clarity within our analysis, we exclude accessions from planted wild germplasm, accessions known to be natural hybrids, admixtures, accessions of unknown origin, and unidentified macadamia accessions (<xref ref-type="supplementary-material" rid="ST3">
<bold>Supplementary Table&#xa0;3</bold>
</xref>). The phylogenetic trees were also generated for four species: <italic>M. integrifolia</italic> (<italic>n</italic> = 44), <italic>M. tetraphylla</italic> (<italic>n</italic> = 49), <italic>M. ternifolia</italic> (<italic>n</italic> = 22), and <italic>M. jansenii</italic> (<italic>n</italic> = 23) separately based on chloroplast genomic data and single-copy nuclear gene sequences. <italic>L. whelanii</italic> was used as an outgroup. All selected sequences were aligned along with the outgroup using MAFFT alignment with default parameters in Geneious 2023.2.1 software (Biomatters Ltd, USA).</p>
<sec id="s2_4_1">
<label>2.4.1</label>
<title>Chloroplast phylogenetic analysis</title>
<p>Chloroplast genomes are widely used in plant phylogenetic analysis (<xref ref-type="bibr" rid="B48">Yanfei et&#xa0;al., 2023</xref>). Therefore, phylogenetic trees were constructed using complete chloroplast genome sequences to investigate the relationships in genus <italic>Macadamia</italic>. To better determine the relationships within the Macadamia species, we first constructed Maximum Likelihood (ML) trees and Bayesian trees for all four species separately using <italic>L. whelanii</italic> as an outgroup.</p>
<p>Chloroplast phylogenetic reconstructions were performed using PAUP*v 4.0 software (<xref ref-type="bibr" rid="B41">Swofford and Sullivan, 2003</xref>) with the maximum likelihood (ML) method and MrBayes v. 3.2 software (<xref ref-type="bibr" rid="B37">Ronquist et&#xa0;al., 2012</xref>) in Geneious for Bayesian inference (BI) method. For PAUP* trees, the Akaike Information Criterion (AIC) in the jModel test was performed in Cyberinfrastructure for Phylogenetic Research (CIPRES) Science Gateway (<ext-link ext-link-type="uri" xlink:href="https://www.phylo.org/">https://www.phylo.org/</ext-link>) to find out the best-fitting nucleotide substitution model (<xref ref-type="bibr" rid="B26">Miller et&#xa0;al., 2010</xref>). ML analysis was performed with 1,000 bootstrap replicates. GTR + Gamma was used in BI analysis. The chloroplast ML tree for the <italic>M. integrifolia</italic> and <italic>M. tetraphylla</italic> populations were generated by the TPM1uf+I+G model and chloroplast ML tree for <italic>M. ternifolia</italic> were generated by the TVM+G model. The topological structures of trees were evaluated based on bootstrap support and Bayesian posterior probabilities. The Interactive Tree of Life (iTOL) v.5 tool (<xref ref-type="bibr" rid="B18">Letunic and Bork, 2021</xref>) (<ext-link ext-link-type="uri" xlink:href="https://itol.embl.de/about.cgi">https://itol.embl.de/about.cgi</ext-link>) was used to visualize the phylogenies.</p>
<p>To further evaluate the phylogenetic relationship between the four species of macadamia, we constructed Bayesian tree methods (GTR + Gamma model) by taking 138 complete macadamia chloroplast genomes using <italic>L. whelanii</italic> as an outgroup.</p>
</sec>
<sec id="s2_4_2">
<label>2.4.2</label>
<title>Nuclear gene phylogenetic analysis</title>
<sec id="s2_4_2_1">
<label>2.4.2.1</label>
<title>Concatenation based phylogeny</title>
<p>Concatenated 53 nuclear gene CDS sequences of <italic>Macadamia</italic> species and <italic>L. whelanii</italic> were used to evaluate the phylogenetic relationships in the genus <italic>Macadamia</italic>. The nuclear gene phylogenetic trees were generated by using Randomized Axelerated Maximum Likelihood (RAxML) version 8 (<xref ref-type="bibr" rid="B39">Stamatakis, 2014</xref>) with the ML method and the BI method in MrBayes v. 3.2 software (<xref ref-type="bibr" rid="B37">Ronquist et&#xa0;al., 2012</xref>) in Geneious 2023.2.1 software (Biomatters Ltd, USA). ML trees were analyzed using the GTR + GAMMA nucleotide model with 1,000 bootstrap replicates. The BI trees were analyzed using the GTR + GAMMA model. The phylogenetic trees were visualized with the iTOL v.5 tool (<xref ref-type="bibr" rid="B18">Letunic and Bork, 2021</xref>). The topological structure of trees produced by RAxML and MrBayes software was compared to identify discrepancies between them.</p>
</sec>
<sec id="s2_4_2_2">
<label>2.4.2.2</label>
<title>Single Nucleotide Polymorphisms (SNPs) based phylogeny</title>
<p>The CDS from 53 genes from <italic>M. integrifolia</italic> (<xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table 2</bold></xref>) were analysed by BLASTed against CDS extracted for <italic>M. integrifolia</italic> (GWHESFF00000000), <italic>M. tetraphylla</italic> (GWHESFG00000000), <italic>M. ternifolia</italic> (GWHESEN00000000) and <italic>M. jansenii</italic> (GWHESFI00000000) (<xref ref-type="bibr" rid="B38">Sharma et al., 2023</xref>) from Genome warehouse (<uri xlink:href="https://ngdc.cncb.ac.cn/gwh/">https://ngdc.cncb.ac.cn/gwh/</uri>) in CLC Genomics Workbench 23.0.05 (CLC-GWB, CLC-Bio, QIAGEN, Denmark, <uri xlink:href="http://www.clcbio.com">http://www.clcbio.com</uri>). The BLAST hits were manually checked. We selected 45 BLAST hits with a single hit for each species (<xref ref-type="supplementary-material" rid="ST4"><bold>Supplementary Table 4</bold></xref>). Then, short reads were trimmed using a 0.01 quality threshold. All the samples were independently mapped to the respective reference genomes of the four species. The mapping setting was as follows: Masking mode (No), Match score (1), Mismatch score (2), Insertion cost (3), Deletion cost (3), Length fraction (1.0), Similarity fraction (0.9) and Global alignment (No). To identify variants, present in selected 45 CDS, the read mappings were then subjected to a Fixed ploidy variant detection tool in CLC Genomics Workbench 23.0.05 (CLC-GWB, CLC-Bio, QIAGEN, Denmark, <uri xlink:href="http://www.clcbio.com">http://www.clcbio.com</uri>). Fixed ploidy variant detection was conducted at the settings as follows; minimum coverage (10), minimum count (3) and minimum frequency (%) (25%). Then, Heterozygous SNP variants were manually filtered for a frequency range of 25 &#x2013; 75% for the two alleles with respect to the reference genomes. Homozygous SNP variants were manually filtered for 100% frequency.  Variants for outgroup <italic>L.&#xa0;whelanii</italic> were identified with respect to the <italic>M. integrifolia</italic> (GWHESFF00000000) reference genome. Individual heterozygous and 100% homozygous variant files were combined to produce a comma separated value format (CSV) tables for each of the 45 CDS in all samples. The CSV files with a final set of SNPs were used to reconstruct CDS sequences for each sample using a Python script (<uri xlink:href="https://github.com/Aeyohan/aght">https://github.com/Aeyohan/aght</uri>). Reconstructed CDS sequences were then aligned with the outgroup using MAFFT alignment with default parameters in Geneious 2023.2.1 software (Biomatters Ltd, USA). Individual gene trees were generated using RAxML version 8 (<xref ref-type="bibr" rid="B39">Stamatakis, 2014</xref>) with the ML method in Geneious 2023.2.1 software (Biomatters Ltd, USA). ML trees were analysed using the GTR +GAMMA nucleotide model with 1000 bootstrap replicates. Then, individual gene trees were used to construct ASTRAL tree (<xref ref-type="bibr" rid="B50">Zhang et al., 2018</xref>). The  Interactive Tree Of Life (iTOL) v.5 tool (<xref ref-type="bibr" rid="B18">Letunic and Bork, 2021</xref>) (https://itol.embl.de/about.cgi) was used to visualize the phylogeny.</p>
</sec>
</sec>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Assessment of phylogeography</title>
<p>Geographical maps of origin were created for all four macadamia species based on the chloroplast phylogenetic clade separation. Geographic ranges were mapped using Esri National Geographic in the QGIS Geographic Information System (Version 3.32.1-Lima) (<ext-link ext-link-type="uri" xlink:href="http://qgis.osgeo.org">http://qgis.osgeo.org</ext-link>). Geographical coordinates of each accession are listed in <xref ref-type="supplementary-material" rid="ST3">
<bold>Supplementary Table&#xa0;3</bold>
</xref>.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Characterization of chloroplast genomes</title>
<p>Following paired-end sequencing (150 bp), a total of 140,789,058&#x2013;260,592,896 reads were obtained for 166 <italic>Macadamia</italic> accessions (<xref ref-type="supplementary-material" rid="ST5">
<bold>Supplementary Table&#xa0;5</bold>
</xref>) with sequence depth of 18.23&#xd7; and 50&#xd7;. The sequence depth of trimmed paired-end reads at a quality score limit of 0.01 ranged between 16.47&#xd7; and 43.98&#xd7;. Two assembled sequences were obtained from GetOrganelle analysis indicating the presence of two structural haplotypes of the chloroplast genome that occurs in plants related to the orientation of the single-copy region. The correct configuration of the chloroplast genome was selected with respect to <italic>M. integrifolia</italic> (Reference sequence: NC_025288.1). Complete chloroplast genome sizes analyzed in this study are shown in <xref ref-type="supplementary-material" rid="ST6">
<bold>Supplementary Table&#xa0;6</bold>
</xref>. Complete circular chloroplast genomes were obtained for all genotypes, ranging in size from 159,195 to 159,734 bp. The smallest chloroplast genome was identified for three <italic>M. tetraphylla</italic> accessions (Mac_297, Mac_338, and Mac_345) and two wild macadamia trees of uncertain species (Mac_047 and Mac_329) while the largest was observed for two <italic>M. integrifolia</italic> accessions (Mac_029 and Mac_262). Chloroplast genome sizes of <italic>M. integrifolia</italic> ranged from 159,458 to 159,734 bp, those of <italic>M. ternifolia</italic> ranged from 159,463 to 159,508 bp, those of <italic>M. tetraphylla</italic> ranged from 159,195 to 159,598 bp, and <italic>M. jansenii</italic> were 159,524 bp in length except for MacP_16 (159,526 bp). The result of this study also revealed that out of 23 <italic>M. jansenii</italic> accessions, 22 accessions had identical chloroplast genomes.</p>
<p>All macadamia chloroplast genomes showed a quadripartite structure of angiosperm, including a large single copy (LSC), a small single copy (SSC), and two identical inverted repeats (IRa and IRb) (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). Gene annotation showed 116 full-length genes, 81 CDS, 4 rRNAs, and 31 tRNAs. Among these 116 genes, 60 genes were involved in protein synthesis and DNA replication (genes responsible for rRNAs, tRNAs, large subunit of ribosome, small subunit of ribosome, and DNA-dependent RNA polymerase), 46 were involved in photosynthesis (genes responsible for subunits of photosystem I, subunits of photosystem II, subunits of ATP synthase, subunits of NADH dehydrogenase, large subunit of rubisco, and subunits of cytochrome complex), 6 were involved in other different functions (genes responsible for inner membrane protein, cytochrome synthesis gene, acetyl-CoA-carboxylase, maturase, ATP-dependent protease, and translational initiation factor), and 4 were involved in unknown function genes (<xref ref-type="supplementary-material" rid="ST7">
<bold>Supplementary Table&#xa0;7</bold>
</xref>).</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>The circular chloroplast genome map of four <italic>Macadamia</italic> species and <italic>Lasjia whelanii</italic>. Genes inside the circle are transcribed in the clockwise direction whereas the genes outside the circle are transcribed in the counterclockwise direction. Genes belonging to different functional groups are colour coded. Gray area in the inner circle indicates the GC content of the chloroplast genome. The four regions of a chloroplast genome are also indicated in the inner circle: the two inverted repeat regions (IRA and IRB) are separated by small (SSC) and large (LSC) single copy regions.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1394244-g001.tif"/>
</fig>
<p>The <italic>L. whelanii</italic> chloroplast genome possessed the standard quadripartite structure, containing two inverted repeats (18,824 bp), the LSC region (87,911 bp), and the SSC region (26,448 bp). (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). Genome size was recorded as 159,631 bp. The plastome of <italic>L. whelanii</italic> contained no significant difference in relation to genes, protein coding genes, rRNA, and tRNA. Overall, the GC content of the chloroplast genome was recorded as 38%.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Chloroplast phylogeny and geographical analysis of <italic>Macadamia</italic> species</title>
<p>The multiple chloroplast genome alignment of 44 <italic>M. integrifolia</italic> accessions together with the outgroup <italic>L. whelanii</italic> was 161,281 bp in length with 99.6% identical sites. The tree topologies of both were similar (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>), and most nodes were supported by high bootstrap support (BS) (&gt;95%) and Bayesian posterior probabilities (PP) (&gt;0.95). However, some internal nodes tended to have low BS, indicating incomplete lineage sorting. The phylogenetic tree construction revealed that Mac_232 (corresponding to population site 90) clusters separately from the rest of the 43 accessions. The remaining accessions were differentiated into two main clades and further differentiated into sub-clades. Clade II contained accessions from the northern distribution of <italic>M. integrifolia</italic>: Mac_231, Mac_262, Mac_029, Mac_265, and Mac_033 from the Gundiah/Mount Bauple region (corresponding to population sites 1, 2, 2, 3, and 3, respectively) (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>) and Mac_052, Mac_091, Mac_340, Mac_248, and Mac_266 from the Gympie region (corresponding to population sites 9, 55, 56, 57, and 57, respectively). Clade III included a total of nine accessions, of which seven were from the Caboolture region: Mac_250, Mac_312, Mac_246, Mac_045, Mac_080, Mac_026, and Mac_143 (corresponding to population sites 20, 21, 21, 71, 76, 76, and 77, respectively) and one from the Nambour region: Mac_044 (corresponding to population site 101). Interestingly, Mac_059 from population site 57 did not cluster with two other accessions (Mac_248 and Mac_266) from population site 57 (Gympie region) in Clade I. Clade IV contained 24 accessions that were collected from the region south of Brisbane except for Mac_251, Mac_089, Mac_139, and Mac_189 (corresponding to population sites 3, 90, 90, and 90, respectively). This observation verified that the accessions having the same geographical origin tend to form distinct clusters among themselves. However, it is noteworthy that certain accessions from these localities exhibit a tendency to associate or cluster with accessions sourced from different geographical areas. The result of this study also revealed that Mac_251, Mac_089, Mac_139, and Mac_189 (corresponding to population sites 3, 90, 90, and 90, respectively) are likely to be planted trees. Mac_312, Mac_246 and Mac_306, Mac_228 are biological replicates and confirmed by clustering together. Additionally, the short branch length of the tree suggested that Mac_232 had less divergence while Mac_026, Mac_044, Mac_080, and Mac_143 from Clade III were more diverged accessions.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>
<bold>(A)</bold> Chloroplast phylogeny of <italic>M. integrifolia</italic> using the ML and BI method. <bold>(B)</bold> Phylogeographic analysis of <italic>M. integrifolia</italic>. Numbers above the lines represent ML bootstrap support/Bayesian posterior probabilities. Numbers indicate corresponding population site (<xref ref-type="supplementary-material" rid="ST3"><bold>Supplementary Table 3</bold></xref>). Light blue: Clade I, Red: Clade II, Purple: Clade III and Green: Clade IV. Coloured dots on the map indicate the corresponding clade in chloroplast phylogenetic tree. Two red circles highlight population site number which contained accessions from different clades.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1394244-g002.tif"/>
</fig>
<p>To study the phylogenetic relationship of <italic>M. tetraphylla</italic>, phylogenetic trees were constructed using 49 complete chloroplast genome sequences. The multiple chloroplast genome alignment of <italic>M. tetraphylla</italic> accessions together with the outgroup <italic>L. whelanii</italic> was 161,554 bp in length with 96% identical sites. ML and BI trees exhibited similar phylogenetic topologies (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>). The resulting phylogenetic tree showed strong statistical support for most internal and external nodes but barring poor BS value for some internal nodes. However, in the Bayesian chloroplast tree, the highest PP value of 1 was observed for all the nodes. The chloroplast tree displayed two major clades. The first major clade (Clade I) consisted of germplasm collected from the southern part: the Lismore region (Mac_060, Mac_108, Mac_134, Mac_268, Mac_244, Mac_031, Mac_297, Mac_184, Mac_083, and Mac_095) and the Ballina region (Mac_247, Mac_325, MacP_14, and Mac_115) except for MacP_15 (corresponding to population site 31) and Mac_097 (corresponding to population site 38) (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>). The second major clade was further divided into sub-clades. Clade II contained accessions from the Murwillumbah region: Mac_341, Mac_314, Mac_227, Mac_270, Mac_098, Mac_064, Mac_291, and Mac_259 (corresponding to population sites 37, 37, 81, 160, 160, 160, 160, and 160, respectively) and the Beenleigh region: Mac_236 (corresponding to population site 100). Two accessions from Clade III from population site 37 clustered separately from the rest of the accessions from the same geographical location. However, as in the <italic>M. integrifolia</italic> chloroplast phylogenetic tree, the majority of <italic>M. tetraphylla</italic> tended to form distinct clusters among themselves based on geographical areas. Results also indicated that Mac_031, Mac_244, and Mac_268 from population site 96 (Clade I) and Mac_264 and Mac_238 from population site 84 (Clade VI) were highly diverged accessions.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>
<bold>(A)</bold> Chloroplast phylogeny of <italic>M. tetraphylla</italic> using the ML and BI method. <bold>(B)</bold> Phylogeographic analysis of <italic>M. tetraphylla</italic>. Numbers above the lines represent ML bootstrap support/Bayesian posterior probabilities. Numbers indicate corresponding population site (<xref ref-type="supplementary-material" rid="ST3"><bold>Supplementary Table 3</bold></xref>). Red: Clade I, Green: Clade II, Brown: Clade IIII, Orange: Clade IV, Light blue: Clade V and Purple: Clade VI. Coloured dots on the map indicate the corresponding clade in chloroplast phylogenetic tree. Four red circles highlight population site number which contained accessions from different clades.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1394244-g003.tif"/>
</fig>
<p>The phylogenetic relationships within <italic>M. ternifolia</italic> accessions were inferred by 22 assembled complete chloroplast genomes. A multiple chloroplast alignment conducted using an outgroup was 160,807 bp with 97.2% identical sites. Phylogenetic trees built with the whole chloroplast genome using both methods had the same topology (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>). The results showed two major clades having MacP_11, Mac_309, and MacP_12 from Nambour (corresponding to population site 88) (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>) in one major clade and the remaining accessions in the second major clade. There was a clear relationship between the phylogenetic structure and geographic origin of the wild accessions of <italic>M. ternifolia</italic>. The resulting topology suggested accessions from Clade IV: Mac_299, Mac_071, Mac_317, Mac_332, and Mac_334 (corresponding to population sites 20, 51, 51, 51, and 51, respectively) were highly diverged accessions. In the <italic>M. jansenii</italic> population, no variants were observed, indicating that all accessions shared the same chloroplast haplotypes except for MacP_16 with a 2-bp difference.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>
<bold>(A)</bold> Chloroplast phylogeny of <italic>M. ternifolia</italic> using the ML and BI method. <bold>(B)</bold> Phylogeographic analysis of <italic>M. ternifolia</italic>. Numbers above the lines represent ML bootstrap support/Bayesian posterior probabilities. Numbers indicate corresponding population site (<xref ref-type="supplementary-material" rid="ST3"><bold>Supplementary Table 3</bold></xref>). Purple: Clade I, Green: Clade II, Red: Clade IIII, Light blue: Clade IV and Orange: Clade V. Coloured dots on the map indicate the corresponding clade in chloroplast phylogenetic tree.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1394244-g004.tif"/>
</fig>
<p>The chloroplast phylogeny tree generated by taking 138 complete chloroplast genomes was supported with a PP of 1.0. Two major clades were identified (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). The first major clade contained 16 <italic>M. tetraphylla</italic> accessions from the Lismore region (Mac_060, Mac_108, Mac_134, Mac_268, Mac_244, Mac_031, Mac_297, Mac_184, Mac_083, and Mac_095), the Ballina region (Mac_247, Mac_325, MacP_14, and Mac_115), the Beenleigh region (MacP_15), and the Murwillumbah region (Mac_097). Interestingly, all these accessions corresponded to Clade I in <italic>M. tetraphylla</italic> chloroplast phylogenetic tree (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>). The second major clade was further differentiated into two sub-clades. All the <italic>M. jansenii</italic> accessions were clustered in one clade. The second sub-clade was further divided into two clades. The small sub-clade contained 10 accessions from the northern distribution of <italic>M. integrifolia</italic> (corresponding to Clade II in the <italic>M. integrifolia</italic> Cp phylogenetic tree) and 1 accession from the Nambour region (corresponding to Clade I in the <italic>M. integrifolia</italic> Cp phylogenetic tree). The larger sub-clade contained all the remaining <italic>M. tetraphylla</italic>, <italic>M. integrifolia</italic>, and <italic>M. ternifolia.</italic> This result shows that accessions that were collected from same locality cluster together. We assumed that chloroplast capture could be the reason for the presence of different species in the same clade when a species coexists in the same geographic area with other species.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Chloroplast phylogeographic results of <italic>Macadamia</italic> species. <bold>(A)</bold> Chloroplast phylogenetic tree of Macadamia using BI method. Light blue: <italic>M. tetraphylla</italic>, Purple: <italic>M. jansenii</italic>, Red: <italic>M. integrifolia</italic> and Green: <italic>M. ternifolia</italic>. Numbers above the lines represent Bayesian posterior probabilities. <bold>(B)</bold> Map of Australia showing origins of Macadamia accessions. Numbers indicate corresponding population site (<xref ref-type="supplementary-material" rid="ST3"><bold>Supplementary Table 3</bold></xref>). Coloured dots on the map indicate the corresponding species. Three red circles highlight population site number which contained accessions from different species.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1394244-g005.tif"/>
</fig>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Nuclear gene phylogenetic analysis</title>
<sec id="s3_3_1">
<label>3.3.1</label>
<title>Concatenation based phylogeny</title>
<p>For <italic>M. integrifolia</italic>, we used a total of 44 accessions. The multiple sequence alignment was 81,747 bp in length with 91% identical sites. The topology of the nuclear gene phylogenetic tree constructed based on both ML and BI methods was nearly identical (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;1</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>2</bold>
</xref>). However, the resulting phylogenetic trees exhibited low bootstrap values (&lt;70) and Bayesian posterior probabilities (&lt;0.95). Moreover, this result was not congruent with the results of the chloroplast phylogenetic tree.</p>
<p>The nucleotide alignment of 49 <italic>M. tetraphylla</italic> accessions along with the outgroup, was 81,753 bp in length. The phylogeny obtained with the ML approach was nearly identical to the BI approach (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;3</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>4</bold>
</xref>). Similar to <italic>M. integrifolia</italic> branching, the support rate is low. The tree topology of nuclear gene phylogeny and chloroplast phylogeny are dissimilar. Next, we constructed nuclear phylogenetic trees for <italic>M. ternifolia</italic> (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;5</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>6</bold>
</xref>) and <italic>M. jansenii</italic> (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;7</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>8</bold>
</xref>) populations with the ML and BI methods. However, the resulting topologies had poor statistical support for internal and external nodes.</p>
<p>An ML tree was also constructed for 138 macadamia genotypes based on the concatenated single-copy nuclear gene CDS. The ML tree demonstrated the presence of four distinct species in the genus <italic>Macadamia</italic>. This well-supported tree classified the population into two main clades (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). The main Clade I consisted of <italic>M. ternifolia</italic> and <italic>M. jansenii</italic> while Clade II consisted of all <italic>M. integrifolia</italic> and <italic>M. tetraphylla</italic>. This outcome underscored the close relationship between <italic>M. ternifolia</italic> and <italic>M. jansenii</italic> and also that between <italic>M. integrifolia</italic> and <italic>M. tetraphylla</italic>.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Nuclear phylogenetic results of <italic>Macadamia</italic> species. Light blue: <italic>M. tetraphylla</italic>, Purple: <italic>M. jansenii</italic>, Red: <italic>M. integrifolia</italic> and Green: <italic>M. ternifolia</italic>. Numbers above the lines represent ML bootstrap support. Phylogenetic tree constructed from coding sequences of 53 single copy genes using 1000 bootstrap replicates. Accessions were colour coded according to the species.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1394244-g006.tif"/>
</fig>
</sec>
<sec id="s3_3_2">
<label>3.3.2</label>
<title>Single Nucleotide Polymorphisms (SNPs) based phylogeny</title>
<p>SNPs based phylogenetic tree for individual genes generated by talking 138 samples was supported with low bootstrap values (&lt;70) (<xref ref-type="supplementary-material" rid="SM2"><bold>Supplementary Figure 9</bold></xref>). However, the ASTRAL tree exhibited high local posterior probability support (LPP) values for external nodes (/1) (<xref ref-type="supplementary-material" rid="SM3"><bold>Supplementary Figure 10</bold></xref>). This well-supported tree demonstrated <italic>M. integrifolia</italic> and <italic>M. tetraphylla</italic> in one clade and <italic>M. ternifolia</italic> and <italic>M. jansenii</italic> in another.</p>
</sec>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>Phylogenetics helps to unravel evolutionary histories and provides valuable insights into the factors driving the growth and adaptation of important plant groups worldwide (<xref ref-type="bibr" rid="B17">Lan et&#xa0;al., 2022</xref>). The current study, using whole-genome sequencing, has resolved the phylogeny of the four <italic>Macadamia</italic> species and confirmed that all the wild accessions belonged to four distinct species. Chloroplast genome sequences have been extensively used in Phylogenetic analysis (<xref ref-type="bibr" rid="B40">Sun et&#xa0;al., 2020</xref>). Chloroplasts are the most metabolically active organelle found in plants that carry out most of the biochemical synthesis process, which required the cell to produce energy through photosynthesis (<xref ref-type="bibr" rid="B7">Dobrogojski et&#xa0;al., 2020</xref>). The chloroplast DNA sequence has unique features compared to the nuclear genome in the analysis of population genetics and evolutionary relationships within families, genus, and species (<xref ref-type="bibr" rid="B6">De Las Rivas et&#xa0;al., 2002</xref>; <xref ref-type="bibr" rid="B2">Ahmad Termizi et&#xa0;al., 2016</xref>). The chloroplast genome is present in high copy numbers, has a low rate of spontaneous mutation, and does not undergo crossovers or recombination. Chloroplast genome sequence data are highly conserved (<xref ref-type="bibr" rid="B7">Dobrogojski et&#xa0;al., 2020</xref>). Earlier research relies on the separation of chloroplast genome from the nuclear genome and mitochondrial genome (<xref ref-type="bibr" rid="B13">Jansen et&#xa0;al., 2005</xref>). With the emergence of NGS technology, new high-throughput approaches have been introduced for the successful isolation of chloroplast sequencing with low cost (<xref ref-type="bibr" rid="B2">Ahmad Termizi et&#xa0;al., 2016</xref>). The read length, sequencing depth, sequence coverage or width, and evenness of coverage influence the accuracy of DNA sequencing using NGS technology. Short-read sequencing has been successfully applied to sequence chloroplast genomes of various plant species (<xref ref-type="bibr" rid="B16">Kyriakidou et&#xa0;al., 2018</xref>). Although there were numerous records of the extensive use of chloroplast genomes in evolutionary relationships in plants, very few studies were presented on the whole chloroplast genome data in macadamia. In this study, the size of all chloroplast genomes was consistent with previous macadamia chloroplast genomes (<xref ref-type="bibr" rid="B30">Nock et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B22">Liu et&#xa0;al., 2017</xref>, <xref ref-type="bibr" rid="B23">Liu et&#xa0;al., 2018</xref>). Genome annotation resulted in a higher number of genes compared to previous studies (<xref ref-type="bibr" rid="B30">Nock et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B22">Liu et&#xa0;al., 2017</xref>, <xref ref-type="bibr" rid="B23">Liu et&#xa0;al., 2018</xref>), which reported 79 CDS, 4 rRNA, and 30 tRNA for <italic>M. integrifolia</italic> (<xref ref-type="bibr" rid="B30">Nock et&#xa0;al., 2014</xref>), <italic>M. ternifolia</italic> (<xref ref-type="bibr" rid="B22">Liu et&#xa0;al., 2017</xref>), and <italic>M. tetraphylla</italic> (<xref ref-type="bibr" rid="B23">Liu et&#xa0;al., 2018</xref>). The difference in the gene number was possibly due to the difference in the annotation tool. All the previous genomes were annotated using Dual Organelle GenoMe Annotator (DOGMA) (<xref ref-type="bibr" rid="B47">Wyman et&#xa0;al., 2004</xref>), while the current genomes were annotated using the GeSeq online tool (<ext-link ext-link-type="uri" xlink:href="https://chlorobox.mpimp-golm.mpg.de/geseq.html">https://chlorobox.mpimp-golm.mpg.de/geseq.html</ext-link>). Moreover, there is no previously reported chloroplast genome for <italic>M. jansenii</italic>. For the first time, we have generated chloroplast genomes for 23 <italic>M. jansenii</italic> accessions using the Get Organelle toolkit (<xref ref-type="bibr" rid="B14">Jin et&#xa0;al., 2020</xref>).</p>
<p>This study provides the most comprehensive analysis of the evolutionary relationships of the chloroplasts within the species in the genus <italic>Macadamia</italic>. The topology of the chloroplast phylogenetic tree with the distinct northern population and southern population of <italic>M. integrifolia</italic> is in agreement with the previously published phylogenetic results (<xref ref-type="bibr" rid="B32">Nock et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B20">Lin et&#xa0;al., 2022</xref>). <xref ref-type="bibr" rid="B32">Nock et&#xa0;al. (2019)</xref> also reported two distinct populations, namely, the Gundiah/Mount Bauple and the Gympie populations in the northern clade. A similar result was also reported by <xref ref-type="bibr" rid="B20">Lin et&#xa0;al. (2022)</xref> based on chloroplast and nuclear phylogenetic analysis. However, our results do not clearly separate accessions between the Gundiah/Mount Bauple region: Mac_231, Mac_262, Mac_029, Mac_265, and Mac_033 (corresponding to population sites 1, 2, 2, 3, and 3, respectively) (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>) and the Gympie region: Mac_052, Mac_091, Mac_340, Mac_248, and Mac_266 (corresponding to population sites 9, 55, 56, 57, and 57, respectively). In this study, the ML/BI phylogenetic tree showed that Mac_232 from Clade I (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>) was clustered separately from three other accessions in Cluster III (Mac_089, Mac_139, and Mac_189) originating from population site 90, suggesting that it is a planted tree. This finding was also supported by previous SSR results, which indicated that the Dulong tree is a planted tree that originated from the Brisbane region (<xref ref-type="bibr" rid="B29">Nock, 2022</xref>). The results also show that Mac_059 from population site 57 is a planted tree, which was not reported previously. Moreover, all the trees from the Sunshine Coast&#x2014;Mac_089, Mac_139, and Mac_189 (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>, Clade IV)&#x2014;are likely to be planted trees, which is consistent with previous studies (<xref ref-type="bibr" rid="B32">Nock et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B29">Nock, 2022</xref>). The results revealed that Mac_026, Mac_044, Mac_080, and Mac_143 are highly diverged accessions, in contrast to the previous study (<xref ref-type="bibr" rid="B24">Mai et&#xa0;al., 2020</xref>), in which Mac_229, Mac_266, Mac_139, and Mac_235 were recognized as diverged accessions. The phylogeographic results of the present study were in agreement with those of the previous study by <xref ref-type="bibr" rid="B24">Mai et&#xa0;al. (2020)</xref>. Chloroplast phylogenetic analysis of <italic>M. tetraphylla</italic> revealed that MacP_15 (corresponding to population site 31), Mac_097 (corresponding to population site 38), and Mac_236 (corresponding to population site 100) (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3A, B</bold>
</xref>) might have been moved by humans as they were clustered with accessions from a different locality. It is noteworthy that we identified MacP_15 and Mac_236 to be outside the range of the natural population. <italic>M. tetraphylla</italic> is mostly distributed in the New South Wales region (<xref ref-type="bibr" rid="B44">Topp et&#xa0;al., 2019</xref>). There is no record of natural occurrence in the Beenleigh, QLD region. Previous studies reported a weak genetic differentiation (<xref ref-type="bibr" rid="B33">O'Connor et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B24">Mai et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B29">Nock, 2022</xref>) for <italic>M. tetraphylla</italic> populations. However, the present study revealed a positive correlation between genetics and geographical distribution.</p>
<p>For the first time, we report the phylogeographic pattern of distribution of genetic variation for the <italic>M. ternifolia</italic> population. However, further investigation is needed with an increased number of samples. Results for the <italic>M. jansenii</italic> accessions identified the presence of one chloroplast haplotype as expected due to the small, isolated population. This suggested that <italic>M. jansenii</italic> has gone through a genetic bottleneck. <italic>M. jansenii</italic> is found only in the Bulburin National Park north of Bundaberg, which is 180&#xa0;km away from any <italic>M. integrifolia</italic> population (<xref ref-type="bibr" rid="B44">Topp et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B24">Mai et&#xa0;al., 2020</xref>). Therefore, the possibility of gene flow between the two populations is limited except for the movement of nuts with the involvement of humans. A decrease in the movement of genes is expected to increase the occurrence of inbreeding among individuals in the population (<xref ref-type="bibr" rid="B11">Hatmaker et&#xa0;al., 2018</xref>). Inbreeding, in turn, can have effects on the genetic health of the population, potentially leading to an accumulation of harmful traits and a decrease in overall fitness (<xref ref-type="bibr" rid="B11">Hatmaker et&#xa0;al., 2018</xref>).</p>
<p>In contrast to the previously recorded phylogenies (<xref ref-type="bibr" rid="B35">Peace, 2005</xref>; <xref ref-type="bibr" rid="B25">Mast et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B24">Mai et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B29">Nock, 2022</xref>), we found that accessions that were collected from the same geographical location were closely related. The distinct separation of <italic>Macadamia</italic> populations within species reported in previous phylogenies (<xref ref-type="bibr" rid="B35">Peace, 2005</xref>; <xref ref-type="bibr" rid="B25">Mast et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B24">Mai et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B29">Nock, 2022</xref>) were based on chloroplast genome analysis. This study shows that reticulate evolution has resulted in chloroplast transfer between species and resulted in distinct chloroplast types within individual species but does not affect the distinctness of the nuclear genomes. Although chloroplast capture was not previously reported in Macadamia, many other plants have reported the occurrence of reticulate evolution of the chloroplast (<xref ref-type="bibr" rid="B1">Acosta and Premoli, 2010</xref>; <xref ref-type="bibr" rid="B46">Wambugu et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B49">Yi et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B27">Moner et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B4">Ananda et&#xa0;al., 2021</xref>). In this study, chloroplast phylogeny separated 16 <italic>M. tetraphylla</italic> accessions from the rest of the accessions. The second major clade was further divided into two clades having all <italic>M. jansenii</italic> in one clade and the rest of the accessions in the other. Furthermore, a sub-clade further separated 11 <italic>M. integrifolia</italic> and 24 <italic>M. tetraphylla</italic> accessions, leaving a complex clade having <italic>M. integrifolia</italic>, <italic>M. ternifolia</italic>, and <italic>M. tetraphylla</italic>. This suggested a series of chloroplast capture events between <italic>M. integrifolia</italic>, <italic>M. ternifolia</italic>, and <italic>M. tetraphylla.</italic>
</p>
<p>Phylogenetic trees built with the single-copy nuclear gene CDS for <italic>Macadamia</italic> species strongly supported four distinct species in the genus <italic>Macadamia</italic> as reported in previous studies (<xref ref-type="bibr" rid="B35">Peace, 2005</xref>; <xref ref-type="bibr" rid="B29">Nock, 2022</xref>). Individual nuclear phylogenetic trees for the four species showed little structure, suggesting widespread gene flow within each species and little geographic structure in the nuclear genome. The SNPs based phylogeny also showed four distinct species in the genus <italic>Macadamia</italic>.</p>
<p>The availability of large sequence data has significantly advanced our understanding of the distribution and diversity of <italic>Macadamia</italic> species, which is essential for both conservation and breeding programs. This advanced knowledge aids in the conservation of these species, now found in fragmented rainforest habitats, by highlighting the importance of <italic>in situ</italic> conservation strategies that focus on capturing a wide range of genetic diversity within sites. Such conservation efforts are crucial not only for safeguarding the species against extinction but also in enhancing their commercial value and sustainability for the future generations.</p>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>All sequence data available at NCBI via Bio Project: PRJNA1036028 with Bio sample number SAMN38356272 - SAMN38356438 (<xref ref-type="supplementary-material" rid="ST8">
<bold>Supplementary Table&#xa0;8</bold>
</xref>).</p>
</sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>SM: Formal analysis, Methodology, Writing &#x2013; original draft. AF: Conceptualization, Project administration, Supervision, Methodology, Formal analysis, Resources, Data curation, Writing &#x2013; review &amp; editing. BT: Conceptualization, Project administration, Supervision, Methodology, Data curation, Writing &#x2013; review &amp; editing. MA: Conceptualization, Supervision, Methodology, Data curation, Writing &#x2013; review &amp; editing. PM: Methodology, Writing &#x2013; review &amp; editing. AK-M: Methodology, Software, Writing &#x2013; review &amp; editing. RH: Conceptualization, Project administration, Funding acquisition, Supervision, Methodology, Formal analysis, Resources, Data curation, Writing &#x2013; review &amp; editing.</p>
</sec>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This work was supported by the Hort Frontiers Advanced Production Systems Fund as part of the Hort Frontiers strategic partnership initiative developed by Hort Innovation, with co-investment from The University of Queensland, and contributions from the Australian Government and BGI Australia. RH was supported by the ARC Centre of Excellence for Plant Success in Nature and Agriculture (CE200100015).</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We gratefully acknowledge Aeyohan Furtado for developing the Python script to reconstruct coding sequences (CDS) from SNP data and the University of Queensland Research Computing Centre (UQ-RCC) for providing all the computation resources. We would like to thank Dr. Catherine J Nock for providing helpful comments on phylogenetic analysis and Denise Bond from Macadamia Conservation Trust for generously sharing data.</p>
</ack>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2024.1394244/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2024.1394244/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="DataSheet2.docx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="DataSheet3.docx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="Table1.xlsx" id="ST1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table2.xlsx" id="ST2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table3.xlsx" id="ST3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table4.xlsx" id="ST4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table5.xlsx" id="ST5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table6.xlsx" id="ST6" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table7.xlsx" id="ST7" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table8.xlsx" id="ST8" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Acosta</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Premoli</surname> <given-names>A. C.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Evidence of chloroplast capture in South American Nothofagus (subgenus Nothofagus, Nothofagaceae)</article-title>. <source>Mol. Phylogenet Evol.</source> <volume>54</volume>, <fpage>235</fpage>&#x2013;<lpage>242</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ympev.2009.08.008</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahmad Termizi</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Hardner</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Batley</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Nock</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Hayashi</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Montenegro</surname> <given-names>J. D.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>SNP analysis ofMacadamia integrifoliachloroplast genomes to determine the genetic structure of wild populations</article-title>. <source>Acta Hortic.</source> <volume>1109)</volume>, <fpage>175</fpage>&#x2013;<lpage>180</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.17660/ActaHortic.2016.1109.29</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alam</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Neal</surname> <given-names>J.</given-names>
</name>
<name>
<surname>O'Connor</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Kilian</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Topp</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Ultra-high-throughput DArTseq-based silicoDArT and SNP markers for genomic studies in macadamia</article-title>. <source>PLoS One.</source> <volume>13</volume>, <elocation-id>e0203465</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0203465</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ananda</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Norton</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Blomstedt</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Furtado</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Moller</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Gleadow</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Phylogenetic relationships in the Sorghum genus based on sequencing of the chloroplast and nuclear genes</article-title>. <source>Plant Genome</source>, <elocation-id>e20123</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/tpg2.20123</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aradhya</surname> <given-names>M. K.</given-names>
</name>
<name>
<surname>Yee</surname> <given-names>L. K.</given-names>
</name>
<name>
<surname>Zee</surname> <given-names>F. T.</given-names>
</name>
<name>
<surname>Manshardt</surname> <given-names>R. M.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Genetic variability in macadamia</article-title>. <source>Genet. Resour. Crop Evol.</source> <volume>45</volume>, <fpage>19</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1008634103954</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>De Las Rivas</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Lozano</surname> <given-names>J. J.</given-names>
</name>
<name>
<surname>Ortiz</surname> <given-names>A. R.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Comparative analysis of chloroplast genomes: functional annotation, genome-based phylogeny, and deduced evolutionary patterns</article-title>. <source>Genome Res.</source> <volume>12</volume>, <fpage>567</fpage>&#x2013;<lpage>583</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.209402</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dobrogojski</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Adamiec</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Luci&#x144;ski</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The chloroplast genome: a review</article-title>. <source>Acta Physiologiae Plantarum.</source> <volume>42</volume>, <fpage>98</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11738-020-03089-x</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Furtado</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>DNA extraction from vegetative tissue for next-generation sequencing</article-title>. <source>Methods Mol. Biol.</source> <volume>1099</volume>, <fpage>1</fpage>&#x2013;<lpage>5</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-1-62703-715-0_1</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hardner</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Pisanu</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Boyton</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2004</year>). <source>National Macadamia Germplasm Conservation Program.</source> (<publisher-loc>Horticulture Australia</publisher-loc>: <publisher-name>CSIRO Plant Industry, Queensland Bioscience Precinct</publisher-name>).</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hardner</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Peace</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Lowe</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Neal</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Pisanu</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Powell</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2009</year>). <article-title>Genetic resources and domestication of macadamia</article-title>. <source>Hortic. Rev.</source> <volume>35</volume>, <fpage>1</fpage>&#x2013;<lpage>25</lpage>.</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hatmaker</surname> <given-names>E. A.</given-names>
</name>
<name>
<surname>Staton</surname> <given-names>M. E.</given-names>
</name>
<name>
<surname>Dattilo</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Hadziabdic</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Rinehart</surname> <given-names>T. A.</given-names>
</name>
<name>
<surname>Schilling</surname> <given-names>E. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Population structure and genetic diversity within the endangered species pityopsis ruthii (Asteraceae)</article-title>. <source>Front. Plant Sci.</source> <volume>9</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2018.00943</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jansen</surname> <given-names>R. K.</given-names>
</name>
<name>
<surname>Kaittanis</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Saski</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>S. B.</given-names>
</name>
<name>
<surname>Tomkins</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Alverson</surname> <given-names>A. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2006</year>). <article-title>Phylogenetic analyses of Vitis (Vitaceae) based on complete chloroplast genome sequences: effects of taxon sampling and phylogenetic methods on resolving relationships among rosids</article-title>. <source>BMC Evol. Biol.</source> <volume>6</volume>, <elocation-id>32</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2148-6-32</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Jansen</surname> <given-names>R. K.</given-names>
</name>
<name>
<surname>Raubeson</surname> <given-names>L. A.</given-names>
</name>
<name>
<surname>Boore</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>dePamphilis</surname> <given-names>C. W.</given-names>
</name>
<name>
<surname>Chumley</surname> <given-names>T. W.</given-names>
</name>
<name>
<surname>Haberle</surname> <given-names>R. C.</given-names>
</name>
<etal/>
</person-group>. (<year>2005</year>). &#x201c;<article-title>Methods for obtaining and analyzing whole chloroplast genome sequences</article-title>,&#x201d; in <source>Molecular Evolution: Producing the Biochemical Data</source>. <publisher-name>University of Texas, Austin</publisher-name>, <fpage>348</fpage>&#x2013;<lpage>384</lpage>.</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jin</surname> <given-names>J. J.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>W. B.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>J. B.</given-names>
</name>
<name>
<surname>Song</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>dePamphilis</surname> <given-names>C. W.</given-names>
</name>
<name>
<surname>Yi</surname> <given-names>T. S.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>GetOrganelle: a fast and versatile toolkit for accurate <italic>de novo</italic> assembly of organelle genomes</article-title>. <source>Genome Biol.</source> <volume>21</volume>, <fpage>241</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-020-02154-5</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kawabe</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Nukii</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Furihata</surname> <given-names>H. Y.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Exploring the history of chloroplast capture in arabis using whole chloroplast genome sequencing</article-title>. <source>Int. J. Mol. Sci.</source> <volume>19</volume>, <fpage>602</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms19020602</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kyriakidou</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Tai</surname> <given-names>H. H.</given-names>
</name>
<name>
<surname>Anglin</surname> <given-names>N. L.</given-names>
</name>
<name>
<surname>Ellis</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Stromvik</surname> <given-names>M. V.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Current strategies of polyploid plant genome sequence assembly</article-title>. <source>Front. Plant Sci.</source> <volume>9</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2018.01660</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lan</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Comparative and phylogenetic analysis of complete chloroplast genomes from five Artemisia species</article-title>. <source>Front. Plant Sci.</source> <volume>13</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.1049209</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Letunic</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Bork</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Interactive Tree Of Life (iTOL) v5: an online tool for phylogenetic tree display and annotation</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>W293</fpage>&#x2013;<lpage>W296</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkab301</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>de la Torre</surname> <given-names>A. R.</given-names>
</name>
<name>
<surname>Sterck</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Canovas</surname> <given-names>F. M.</given-names>
</name>
<name>
<surname>Avila</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Merino</surname> <given-names>I.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Single-copy genes as molecular markers for phylogenomic studies in seed plants</article-title>. <source>Genome Biol. Evol.</source> <volume>9</volume>, <fpage>1130</fpage>&#x2013;<lpage>1147</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evx070</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Signatures of selection in recently domesticated macadamia</article-title>. <source>Nat. Commun.</source> <volume>13</volume>, <fpage>242</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-021-27937-7</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>G.-Q.</given-names>
</name>
<name>
<surname>Lian</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>The molecular phylogeny of land plants: progress and future prospects</article-title>. <source>Diversity.</source> <volume>14</volume>, <elocation-id>782</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/d14100782</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Niu</surname> <given-names>Y. F.</given-names>
</name>
<name>
<surname>Ni</surname> <given-names>S. B.</given-names>
</name>
<name>
<surname>He</surname> <given-names>X. Y.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Complete chloroplast genome of a subtropical fruit tree Macadamia ternifolia (Proteaceae)</article-title>. <source>Mitochondrial DNA B Resour.</source> <volume>2</volume>, <fpage>738</fpage>&#x2013;<lpage>739</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/23802359.2017.1390401</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Niu</surname> <given-names>Y. F.</given-names>
</name>
<name>
<surname>Ni</surname> <given-names>S. B.</given-names>
</name>
<name>
<surname>He</surname> <given-names>X. Y.</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z. Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>The whole chloroplast genome sequence of Macadamia tetraphylla (Proteaceae)</article-title>. <source>Mitochondrial DNA B Resour.</source> <volume>3</volume>, <fpage>1276</fpage>&#x2013;<lpage>1277</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/23802359.2018.1532836</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mai</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Alam</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hardner</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Henry</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Topp</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Genetic structure of wild germplasm of macadamia: species assignment, diversity and phylogeographic relationships</article-title>. <source>Plants (Basel).</source> <volume>9</volume>, <elocation-id>714</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/plants9060714</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mast</surname> <given-names>A. R.</given-names>
</name>
<name>
<surname>Willis</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Jones</surname> <given-names>E. H.</given-names>
</name>
<name>
<surname>Downs</surname> <given-names>K. M.</given-names>
</name>
<name>
<surname>Weston</surname> <given-names>P. H.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>A smaller Macadamia from a more vagile tribe: inference of phylogenetic relationships, divergence times, and diaspore evolution in Macadamia and relatives (tribe Macadamieae; Proteaceae)</article-title>. <source>Am. J. Bot.</source> <volume>95</volume>, <fpage>843</fpage>&#x2013;<lpage>870</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3732/ajb.0700006</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Miller</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Pfeiffer</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Schwartz</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2010</year>). &#x201c;<article-title>Creating the CIPRES Science Gateway for inference of large phylogenetic trees</article-title>&#x201d;, in<source> 2010 gateway computing environments workshop (GCE)</source>, p. <fpage>1</fpage>-<lpage>8</lpage>.</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moner</surname> <given-names>A. M.</given-names>
</name>
<name>
<surname>Furtado</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Henry</surname> <given-names>R. J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Two divergent chloroplast genome sequence clades captured in the domesticated rice gene pool may have significance for rice production</article-title>. <source>BMC Plant Biol.</source> <volume>20</volume>, <fpage>472</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12870-020-02689-6</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nge</surname> <given-names>F. J.</given-names>
</name>
<name>
<surname>Biffin</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Thiele</surname> <given-names>K. R.</given-names>
</name>
<name>
<surname>Waycott</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Reticulate evolution, ancient chloroplast haplotypes, and rapid radiation of the Australian plant genus adenanthos (Proteaceae)</article-title>. <source>Front. Ecol. Evol.</source> <volume>8</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fevo.2020.616741</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Nock</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <source>Genetic diversity and population structure of wild and domesticated macadamia</source>.</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nock</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Baten</surname> <given-names>A.</given-names>
</name>
<name>
<surname>King</surname> <given-names>G. J.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Complete chloroplast genome of Macadamia integrifoliaconfirms the position of the Gondwanan early-diverging eudicot family Proteaceae</article-title>. <source>BMC Genomics.</source> <volume>15</volume>, <fpage>S13</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2164-15-s9-s13</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nock</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Baten</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Mauleon</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Langdon</surname> <given-names>K. S.</given-names>
</name>
<name>
<surname>Topp</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Hardner</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Chromosome-scale assembly and annotation of the macadamia genome (Macadamia integrifolia HAES 741)</article-title>. <source>G3 (Bethesda).</source> <volume>10</volume>, <fpage>3497</fpage>&#x2013;<lpage>3504</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1534/g3.120.401326</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nock</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Hardner</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Montenegro</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Ahmad Termizi</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Hayashi</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Playford</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Wild origins of macadamia domestication identified through intraspecific chloroplast genome sequencing</article-title>. <source>Front. Plant Sci.</source> <volume>10</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2019.00334</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>O'Connor</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Powell</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Nock</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Shapcott</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Crop to wild gene flow and genetic diversity in a vulnerable Macadamia (Proteaceae) species in New South Wales, Australia</article-title>. <source>Biol. Conserv.</source> <volume>191</volume>, <fpage>504</fpage>&#x2013;<lpage>511</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.biocon.2015.08.001</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>O&#x2019;Connor</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Kilian</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hayes</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Hardner</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Nock</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Baten</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Population structure, genetic diversity and linkage disequilibrium in a macadamia breeding population using SNP and silicoDArT markers</article-title>. <source>Tree Genet. Genomes.</source> <volume>15</volume>, <fpage>1</fpage>-<lpage>6</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11295-019-1331-z</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Peace</surname> <given-names>C. P.</given-names>
</name>
</person-group> (<year>2005</year>). <source>Genetic characterisation of Macadamia with DNA markers.</source> (<publisher-loc>Australia</publisher-loc>: <publisher-name>The University of Queensland, School of Molecular and Microbial Sciences</publisher-name>).</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rieseberg</surname> <given-names>L. H.</given-names>
</name>
<name>
<surname>Soltis</surname> <given-names>D. E.</given-names>
</name>
</person-group> (<year>1991</year>). <article-title>Phylogenetic consequences of cytoplasmic gene flow in plants</article-title>. <source>Zurich Switzerland: Evolutionary Trends Plants.</source>  <volume>5</volume>, <fpage>65</fpage>-<lpage>84</lpage>.</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ronquist</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Teslenko</surname> <given-names>M.</given-names>
</name>
<name>
<surname>van der Mark</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Ayres</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Darling</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hohna</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>MrBayes 3.2: efficient Bayesian phylogenetic inference and model choice across a large model space</article-title>. <source>Syst. Biol.</source> <volume>61</volume>, <fpage>539</fpage>&#x2013;<lpage>542</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/sysbio/sys029</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sharma</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Masouleh</surname> <given-names>A. K.</given-names>
</name>
<name>
<surname>Constantin</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Topp</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Furtado</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Henry</surname> <given-names>R. J.</given-names>
</name>
</person-group> (<year>2023</year>). <source>The genomes of the Macadamia genus</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2023.12.07.570730</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stamatakis</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>RAxML version 8: a tool for phylogenetic analysis and post-analysis of large phylogenies</article-title>. <source>Bioinformatics.</source> <volume>30</volume>, <fpage>1312</fpage>&#x2013;<lpage>1313</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btu033</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Evolutionary and phylogenetic aspects of the chloroplast genome of Chaenomeles species</article-title>. <source>Sci. Rep.</source> <volume>10</volume>, <fpage>11466</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-020-67943-1</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Swofford</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Sullivan</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2003</year>). &#x201c;<article-title>Phylogeny inference based on parsimony and other methods using PAUP*</article-title>&#x201d;, in <source>The phylogenetic handbook: a practical approach to DNA and protein phylogeny.</source> <volume>7</volume>, pp.<fpage>160</fpage>-<lpage>206</lpage>. </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tanksley</surname> <given-names>S. D.</given-names>
</name>
<name>
<surname>McCouch</surname> <given-names>S. R.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>Seed banks and molecular maps: unlocking genetic potential from the wild</article-title>. <source>Science.</source> <volume>277</volume>, <fpage>1063</fpage>&#x2013;<lpage>1066</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.277.5329.1063</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tillich</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Lehwark</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Pellizzer</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Ulbricht-Jones</surname> <given-names>E. S.</given-names>
</name>
<name>
<surname>Fischer</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Bock</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>). GeSeq - versatile and accurate annotation of organelle genomes</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume>, <fpage>W6</fpage>&#x2013;<lpage>W11</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkx391</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Topp</surname> <given-names>B. L.</given-names>
</name>
<name>
<surname>Nock</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Hardner</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Alam</surname> <given-names>M.</given-names>
</name>
<name>
<surname>O&#x2019;Connor</surname> <given-names>K. M.</given-names>
</name>
</person-group> (<year>2019</year>). &#x201c;<article-title>Macadamia (Macadamia spp.) breeding</article-title>,&#x201d; in <source>Advances in plant breeding strategies: Nut and beverage crops.</source> <volume>4</volume>, <fpage>221</fpage>&#x2013;<lpage>251</lpage>.</citation>
</ref>
<ref id="B45">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Walton</surname> <given-names>H.M.W.A.D.A.</given-names>
</name>
</person-group> (<year>2011</year>). &#x201c;<article-title>Macadamia (Macadamia integrifolia, Macadamia tetraphylla and hybrids)</article-title>,&#x201d; in <source>Postharvest Biology and Technology of Tropical and Subtropical Fruits: Cocona to Mango</source>. Ed. <person-group person-group-type="editor">
<name>
<surname>Yahia</surname> <given-names>E. M.</given-names>
</name>
</person-group> (<publisher-loc>Cambridge, England</publisher-loc>: <publisher-name>Woodhead Publishing Limited</publisher-name>), <fpage>450</fpage>&#x2013;<lpage>474</lpage>.</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wambugu</surname> <given-names>P. W.</given-names>
</name>
<name>
<surname>Brozynska</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Furtado</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Waters</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Henry</surname> <given-names>R. J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Relationships of wild and domesticated rices (Oryza AA genome species) based upon whole chloroplast genome sequences</article-title>. <source>Sci. Rep.</source> <volume>5</volume>, <elocation-id>13957</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/srep13957</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wyman</surname> <given-names>S. K.</given-names>
</name>
<name>
<surname>Jansen</surname> <given-names>R. K.</given-names>
</name>
<name>
<surname>Boore</surname> <given-names>J. L.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Automatic annotation of organellar genomes with DOGMA</article-title>. <source>Bioinformatics.</source> <volume>20</volume>, <fpage>3252</fpage>&#x2013;<lpage>3255</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bth352</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yanfei</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Tai</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Chunhua</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Jia</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Fazhong</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Complete chloroplast genome sequences of the medicinal plant Aconitum transsectum (Ranunculaceae): comparative analysis and phylogenetic relationships</article-title>. <source>BMC Genomics.</source> <volume>24</volume>, <fpage>90</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12864-023-09180-0</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yi</surname> <given-names>T. S.</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>G. H.</given-names>
</name>
<name>
<surname>Wen</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Chloroplast capture and intra- and inter-continental biogeographic diversification in the Asian - New World disjunct plant genus Osmorhiza (Apiaceae)</article-title>. <source>Mol. Phylogenet Evol.</source> <volume>85</volume>, <fpage>10</fpage>&#x2013;<lpage>21</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ympev.2014.09.028</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Rabiee</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Sayyari</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Mirarab</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>ASTRAL-III: polynomial time species tree reconstruction from partially resolved gene trees</article-title>. <source>BMC Bioinformatics.</source> <volume>19</volume> (<supplement>Suppl 6</supplement>), <fpage>153</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12859-018-2129-y</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Batley</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Exploring the application of wild species for crop improvement in a changing climate</article-title>. <source>Curr. Opin. Plant Biol.</source> <volume>56</volume>, <fpage>218</fpage>&#x2013;<lpage>222</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pbi.2019.12.013</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Ebrahimi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Woeste</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>P.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Whole genome based insights into the phylogeny and evolution of the Juglandaceae</article-title>. <source>BMC Ecol. Evol.</source> <volume>21</volume>, <elocation-id>191</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12862-021-01917-3</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>