<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1375488</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2024.1375488</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Mechanistic analysis of the hardening process of the thorns on stems of <italic>Bougainvillea glabra &#x201c;Elizabeth Angus&#x201d;</italic>
</article-title>
<alt-title alt-title-type="left-running-head">Sun et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fgene.2024.1375488">10.3389/fgene.2024.1375488</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Sun</surname>
<given-names>Lina</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Huaxin</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Jinhua</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gong</surname>
<given-names>Jianying</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Shuting</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Kaitai</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Er</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Bing</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lu</surname>
<given-names>Zhixiang</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Qi</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/512486/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Lin</surname>
<given-names>Mao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2637860/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Guangxi Forestry Research Institute</institution>, <addr-line>Nanning</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>School of Agriculture and Biology, Shanghai Jiaotong University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Nanning GoldTech Biotechnology Ltd.</institution>, <addr-line>Nanning</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/187350/overview">Andrey Grigoriev</ext-link>, Rutgers, The State University of New Jersey, United States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1071003/overview">Xingyun Qi</ext-link>, Rutgers University Camden, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2727437/overview">Qiu Li-hang</ext-link>, Guangxi Academy of Agricultural Science, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Mao Lin, <email>49888178@qq.com</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>04</day>
<month>07</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1375488</elocation-id>
<history>
<date date-type="received">
<day>23</day>
<month>01</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>06</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Sun, Wang, Li, Gong, Yang, Yang, Chen, Li, Lu, Chen and Lin.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Sun, Wang, Li, Gong, Yang, Yang, Chen, Li, Lu, Chen and Lin</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>
<bold>Introduction:</bold> <italic>Bougainvillea glabra</italic> &#x201c;<italic>Elizabeth Angus</italic>&#x201c; is a thorny woody vine or shrub. However, the hard thorns are considered a deficiency in its ornamental value.</p>
<p>
<bold>Methods:</bold> To find the genes and pathways related to the hardening process of the thorns on the stems of <italic>B. glabra</italic>, the eukaryotic unreferenced transcriptome sequencing analysis was conducted to explore the 3 stages of the thorn-hardening process. Total RNA was extracted from thorns and stems, and transcriptome libraries were constructed and sequenced using unreferenced Illumina sequencing.</p>
<p>
<bold>Results:</bold> Gene function annotation was performed using various databases, resulting in 8937 co-annotated genes. The density distribution of Fragments Per Kilobase of transcript per Million mapped reads (FPKM) depicted the overall gene expression patterns. The study found that stage 2 as the period of highest gene expression activity during the thorns hardening process in <italic>B. glabra</italic>. Differential expression analysis revealed that during thorn-hardening, 1045 genes up-regulated and 391 genes down-regulated significantly in thorns at stage 2 compared to stage 1 (early stage of thorns formation). Meanwhile, 938 genes up-regulated and 784 genes down-regulated significantly in stems. At stage 3, as thorns became harder, 63 genes exhibited notable expression increase and 98 genes&#x2019; expression decreased obviously within thorns, and 46 genes up-regulated and 29 genes down-regulated in stems, compared to stage 2. Phenylpropanoid biosynthesis was the key step in the hardening process of the thorns of <italic>B. glabra</italic>. The formation and hardening of thorns on the stem of <italic>B. glabra</italic> was a process in which lignin gradually accumulated in the thorns, and several genes were involved in this process. They include <italic>PAL</italic> (EC:4.3.1.24), <italic>CYP73A</italic> (EC:1.14.14.91), <italic>4CL</italic> (EC:6.2.1.12), <italic>CCR</italic> (EC:1.2.1.44), <italic>CAD</italic> (EC:1.1.1.195) and <italic>POX</italic> (EC:1.11.1.7).</p>
<p>
<bold>Discussion:</bold> This transcriptome analysis offers insights into the molecular mechanisms underlying thorns development in this plant species.</p>
</abstract>
<kwd-group>
<kwd>
<italic>Bougainvillea glabra &#x201c;Elizabeth Angus&#x201d;</italic>
</kwd>
<kwd>hardening of the thorns</kwd>
<kwd>transcriptome</kwd>
<kwd>phenylpropanoid biosynthesis</kwd>
<kwd>lignin</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>RNA</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>
<italic>Bougainvillea glabra &#x201c;Elizabeth Angus&#x201d;</italic> is an evergreen climbing shrub of Centrospermae (order), Nyctaginaceae (family) (<xref ref-type="bibr" rid="B14">Wu et al., 2003</xref>). It is originally from South America, including Brazil, Peru, Argentina&#x2019;s Chubut Province (<xref ref-type="bibr" rid="B11">Lim, 2014</xref>), Bolivia, Ecuador, and Paraguay (<xref ref-type="bibr" rid="B2">Bautista et al., 2022</xref>). <italic>Bougainvillea glabra</italic> is widely grown in tropical and subtropical regions in China, where it has been introduced and cultivated for over a century. Presently, in the tropical and subtropical regions of China, such as Guangdong, Hainan, Guangxi, Fujian, and Yunnan Province, <italic>B</italic>. <italic>glabra</italic> has been extensively cultivated demonstrating its adaptability, ease of cultivation, for its colorful flowers (<xref ref-type="bibr" rid="B16">Yanjing, 2010</xref>), within the realm of landscaping and ornamental horticulture.</p>
<p>
<italic>Bougainvillea glabra</italic> grows as a woody vine or shrub with thorny stems. In the early stage of formation, the thorns on the stems of <italic>B</italic>. <italic>glabra</italic> are green in color and soft in texture. After that, the color gradually deepens and eventually becomes dark brown, and the texture becomes very hard. Ornamental evaluation of <italic>B</italic>. <italic>glabra</italic> involves multiple target traits (<xref ref-type="bibr" rid="B13">Sun Lina et al., 2016</xref>), and the rigidity of the thorns on the stems could be considered a target trait. We focus our study on the hardening process of the thorns on the stems of <italic>B</italic>. <italic>glabra</italic> to identify the genes that regulate this process. According to previous studies, it is known that the mechanical strength of plant stems mainly depends on the formation of secondary cell walls. The secondary cell walls are composed mainly of cellulose, hemicellulose, and lignin (<xref ref-type="bibr" rid="B9">Kushwah et al., 2020</xref>). Lignin is essential for the mechanical support of plants, for example, lignin deposition is believed to play an important role in cotton fiber development. Another example is that the development of wood properties depends on the lignin deposition (<xref ref-type="bibr" rid="B1">Antonova et al., 2014</xref>). Based on these previous studies, it is hypothesized that the synthesis and deposition of cellulose and lignin are closely related to thorn formation in <italic>B</italic>. <italic>glabra</italic>. This research will provide a scientific basis for the cultivation of soft thorns or thorn-free <italic>B</italic>. <italic>glabra</italic> and would provide valuable insights into the developmental regulation of woody modifications in higher plants.</p>
<p>To search for genes and pathways related to the hardening process of <italic>B</italic>. <italic>glabra</italic> thorns, we conducted eukaryotic unreferenced transcriptome sequencing analysis because there is no complete genome information available for this plant species in existing online databases. Our study aims to provide a scientific basis for the cultivation of soft thorns or thorn-free <italic>B. glabra</italic> and to gain insights into the developmental regulation of woody modifications in higher plants.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and methods</title>
<sec id="s2-1">
<title>Plant material</title>
<p>
<italic>Bougainvillea glabra</italic> is grown (1 age of these trees) in Nanning, Guangxi Province in China. Three stages in the development of the thorns were identified <italic>viz.</italic>, as given in sample <xref ref-type="table" rid="T1">Table 1</xref> below; please refer to the table for a detailed description of the correct stages.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Sampling of thorns and stem from <italic>Bougainvillea glabra</italic> used for RNA isolation in triplicates.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Stage</th>
<th align="left">Thorn morphology/size/days</th>
<th align="left">Sample numbering</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Stage 1 thorns</td>
<td align="left">Young soft green/2&#x2013;4 mm/5 days (<xref ref-type="fig" rid="F1">Fig1B</xref>)</td>
<td align="left">C1&#x2013;1; C1&#x2013;2; C1&#x2013;3</td>
</tr>
<tr>
<td align="left">Stage 2 thorns</td>
<td align="left">Young green but hard/5&#x2013;6 mm/25 days (<xref ref-type="fig" rid="F1">Fig1C</xref>)</td>
<td align="left">C2&#x2013;1; C2&#x2013;2; C2&#x2013;3</td>
</tr>
<tr>
<td align="left">Stage 3 thorns</td>
<td align="left">Mature greenish brown hard/7&#x2013;8 mm/35 days (<xref ref-type="fig" rid="F1">Fig1D</xref>)</td>
<td align="left">C3&#x2013;1; C3&#x2013;2; C3&#x2013;3</td>
</tr>
<tr>
<td align="left">Stage 1 stems</td>
<td align="left">Young green stems</td>
<td align="left">J1&#x2013;1; J1&#x2013;2; J1&#x2013;3</td>
</tr>
<tr>
<td align="left">Stage 2 stems</td>
<td align="left">Young green stems but hard</td>
<td align="left">J2&#x2013;1; J2&#x2013;2; J2&#x2013;3</td>
</tr>
<tr>
<td align="left">Stage 3 stems</td>
<td align="left">Mature hard brown stems</td>
<td align="left">J3&#x2013;1; J3&#x2013;2; J3&#x2013;3</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In different stages of thorn formation on the stems, the thorns and stems of <italic>B</italic>. <italic>glabra</italic> were collected for transcriptome analysis. The three stages for analysis include the early stage of thorn formation, the stage in which thorns were hardened, and the stage that is between them. Triplicate samples for each stage were included.</p>
</sec>
<sec id="s2-2">
<title>Transcriptome analysis</title>
<sec id="s2-2-1">
<title>Library preparation for transcriptome sequencing</title>
<p>A total amount of 1.5&#xa0;&#x3bc;g RNA per sample was used as an input material for the RNA sample preparations. Sequencing libraries were generated using the NEBNext<sup>&#xae;</sup> Ultra&#x2122; RNA Library Prep Kit for Illumina<sup>&#xae;</sup> (NEB, United States), following the manufacturer&#x2019;s recommendations, and index codes were added to attribute sequences to each sample. In brief, mRNA was purified from total RNA using poly-T oligo-attached magnetic beads. Fragmentation was carried out using divalent cations under elevated temperature in NEBNext First Strand Synthesis Reaction Buffer (5X). First-strand cDNA was synthesized using a random hexamer primer and M-MuLV Reverse Transcriptase (RNase H). Second-strand cDNA synthesis was subsequently performed using DNA polymerase I and RNase H. Remaining overhangs were converted into blunt ends <italic>via</italic> exonuclease/polymerase activities. After adenylation of 3&#x2032; ends of DNA fragments, NEBNext Adaptor with a hairpin loop structure was ligated to prepare for hybridization. To select cDNA fragments of preferentially 150&#x2013;200 bp in length, the library fragments were purified using the AMPure XP system (Beckman Coulter, Beverly, United States). Then, 3&#xa0;&#x3bc;L USER Enzyme (NEB, United States) was used with size-selected, adaptor-ligated cDNA at 37&#xb0;C for 15&#xa0;min, followed by 5&#xa0;min at 95&#xb0;C before PCR. Then, PCR was performed with Phusion High-Fidelity DNA polymerase, universal PCR primers, and index (X) primer. At last, PCR products were purified (AMPure XP system), and library quality was assessed on the Agilent Bioanalyzer 2100 system.</p>
</sec>
</sec>
<sec id="s2-3">
<title>Clustering and sequencing</title>
<p>The clustering of the index-coded samples was performed on a cBot Cluster Generation System using TruSeq PE Cluster Kit v3-cBot-HS (Illumina), according to the manufacturer&#x2019;s instructions. After cluster generation, the library preparations were sequenced on an Illumina HiSeq platform, and paired-end reads were generated.</p>
</sec>
<sec id="s2-4">
<title>Data analysis</title>
<p>Raw data (raw reads) of fastq format were first processed through in-house perl scripts. In this step, clean data (clean reads) were obtained by removing reads containing the adapter, reads containing ploy-N, and reads whose quality was low from raw data. At the same time, Q20, Q30, and GC content of the clean data were calculated. All the downstream analyses were based on clean data with high quality.</p>
<p>The left ends (read1 files) of fastq format were pooled into one big left.fq file, and the right end (read2 files), into one big right.fq file. The transcriptome assembly was accomplished based on left.fq and right.fq using Trinity (<xref ref-type="bibr" rid="B5">Grabherr et al., 2011</xref>) with min kmer cov set to 2 by default and all other parameters set to default. The assembled transcripts were hierarchically clustered to unigenes using shared reads and expressions by Corset (<xref ref-type="bibr" rid="B4">Davidson and Oshlack, 2014</xref>).</p>
<p>The correlation of gene expression levels between samples is a crucial indicator to test the reliability of an experiment and to check whether the sample selection is reasonable. It is essential to check the correlation of gene expression levels between samples before performing differential expression analysis. The Pearson correlation coefficient represents the correlation of gene expression levels between samples. The closer the correlation coefficient is to 1, the higher the similarity of expression patterns between samples. A correlation coefficient between 0.8 and 1 indicates a very strong correlation. If the correlation coefficient between samples of biological repeats is lower than 0.8, it means that the samples&#x2019; correlation is low. The correlation between pairwise comparisons of the three biological replicates at the same site in the same period is above 0.8, indicating that their respective gene expression levels are similar.</p>
<p>Gene function was annotated based on the NCBI non-redundant protein and nucleotide sequences. Gene function was also annotated by the Pfam (protein family), KOG/COG (clusters of orthologous groups of proteins), Swiss-Prot (a manually annotated and reviewed protein sequence database), KEGG Ortholog database (<xref ref-type="bibr" rid="B8">Kanehisa and Goto, 2000</xref>), and Gene Ontology (GO).</p>
</sec>
<sec id="s2-5">
<title>SNP calling</title>
<p>Picard-tools v1.41 and samtools v0.1.18 were used to sort, remove duplicated reads, and merge the bam alignment results of each sample. GATK3 software was used to perform SNP calling. Raw vcf files were filtered using the GATK standard filter method and other parameters (cluster: 3; window size: 35; QD &#x3c; 2.0 or FS &#x3e; 60.0 or MQ &#x3c; 40.0 or SOR &#x3e;4.0 or MQRankSum &#x3c; &#x2212;12.5 or ReadPosRankSum &#x3c; &#x2212;8.0 or DP &#x3c; 10).</p>
</sec>
<sec id="s2-6">
<title>SSR detection and primer design</title>
<p>SSR of the transcriptome was identified using MISA (<ext-link ext-link-type="uri" xlink:href="http://pgrc.ipk-gatersleben.de/misa/misa.html">http://pgrc.ipk-gatersleben.de/misa/misa.html</ext-link>), and the primer for each SSR was designed using Primer3 (<ext-link ext-link-type="uri" xlink:href="http://primer3.sourceforge.net/releases.php">http://primer3.sourceforge.net/releases.php</ext-link>). Quantification of gene expression levels was estimated by RSEM (<xref ref-type="bibr" rid="B10">Li and Dewey, 2011</xref>) for each sample: 1. clean data were mapped back onto the assembled transcriptome; 2. read count for each gene was obtained from the mapping results.</p>
</sec>
<sec id="s2-7">
<title>Differential expression analysis</title>
<p>Differential expression analysis of two conditions/groups (two biological replicates per condition) was performed using the Differential Expression Sequence (DESeq) R package (1.18.0). DESeq provides statistical routines for determining differential expression in digital gene expression data using a model based on the negative binomial distribution. The resulting <italic>p</italic>-values were adjusted using the Benjamini and Hochberg&#x2019;s approach for controlling the false discovery rate. Genes with an adjusted <italic>p</italic>-value &#x3c;0.05 found by DESeq were assigned as differentially expressed.</p>
<p>Prior to differential gene expression analysis, for each sequenced library, the read counts were adjusted using the edgeR program package through one scaling normalized factor. Differential expression analysis of two conditions was performed using the DEGSeq R package (1.20.0). The <italic>p</italic>-values were adjusted using the Benjamini and Hochberg method. A corrected <italic>p</italic>-value of 0.005 and log2 (fold change) of 1 were set as the threshold for significantly differential expression.</p>
</sec>
<sec id="s2-8">
<title>GO and KEGG enrichment analyses of differentially expressed genes</title>
<p>GO enrichment analysis of differentially expressed genes (DEGs) was implemented using the GOseq R package, in which the gene length bias was corrected. GO terms with a corrected <italic>p</italic>-value of less than 0.05 were considered significantly enriched by DEGs. KEGG is a database resource for understanding high-level functions and utilities of the biological system, such as the cell, the organism, and the ecosystem, from molecular-level information, especially large-scale molecular datasets generated by genome sequencing and other high-throughput experimental technologies (<ext-link ext-link-type="uri" xlink:href="http://www.genome.jp/kegg/">http://www.genome.jp/kegg/</ext-link>) (<xref ref-type="bibr" rid="B7">Kanehisa, 2019</xref>). We used KOBAS software to test the statistical enrichment of differential expression genes in KEGG pathways.</p>
</sec>
<sec id="s2-9">
<title>PPI analysis of differentially expressed genes</title>
<p>Protein&#x2013;protein interaction (PPI) analysis of DEGs was based on the STRING database, with known and predicted PPIs. For the species existing in the database, we constructed the networks by extracting the target gene list from the database. Otherwise, Blastx (v2.2.28) was used to align the target gene sequences to the selected reference protein sequences, and then, the networks were built according to the known interaction of selected reference species.</p>
</sec>
<sec id="s2-10">
<title>Transcription factor analysis</title>
<p>Transcription factor (TF) prediction is done using iTAK software, the basic principle of which is to identify TFs by hmmscan using the categorized and defined TF (transcription factor) family and rules in the database.</p>
</sec>
<sec id="s2-11">
<title>RT-qPCR verification</title>
<p>Expression profiling of six genes of the phenylpropanoid pathway was carried out using the reverse transcription fluorogenic quantitative polymerase chain reaction (RT-qPCR). The total RNA from thorns and stems of <italic>B</italic>. <italic>glabra</italic> at three stages was extracted using the HiPure HP Plant RNA Mini Kit (Magen Biotechnology Co., Ltd, R4165-02). cDNA was reverse-transcribed from mRNA using HiScript II Q RT SuperMix for qPCR (&#x2b;gDNA wiper) (Vazyme Biotech Co., Ltd, R223-01). cDNA and ChamQ Universal SYBR qPCR Master Mix (Vazyme Biotech Co., Ltd, Q711-02) were used for qPCR. Real-time quantitative PCR analysis was conducted using the qTOWER3 system (AnalytikJena, German). The primers used in RT-qPCR are provided in <xref ref-type="sec" rid="s11">Supplementary Table S1</xref>.</p>
</sec>
<sec id="s2-12">
<title>Determination of the lignin content</title>
<p>The samples were dried at 80&#xb0;C until they reached a constant weight, pulverized, passed through a 40-mesh sieve, and weighed for a certain amount (denoted as W). Acetylation of phenolic hydroxyl groups of lignin in samples was performed. Following the acetylation of phenolic hydroxyl groups within lignin, a discernible absorption peak at 280&#xa0;nm became evident. Notably, the absorbance measurement at 280&#xa0;nm exhibited a direct positive correlation with the lignin content present. In this study, the lignin content was characterized by the absorbance value at 280&#xa0;nm. The formula for converting 280&#xa0;nm absorbance to lignin content is as follows: Lignin (mg/g) &#x3d; (&#x394;A-0.0068)&#xf7;0.0347&#xd7;V&#xd7;10&#x2013;3&#xf7;W&#xd7;T &#x3d; 0.0294&#xd7;(&#x394;A-0.0068) &#xf7;0.002 &#xd7; 50. (V, total volume of the reaction; W, sample quality (dry weight); T, dilution factor; A, measurement of absorbance at 280nm; &#x394;A, measurement of absorbance at 280&#xa0;nm of the sample and absorbance value at 280&#xa0;nm for blank control).</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec id="s3-1">
<title>Overview of transcriptome analysis</title>
<p>For research purposes, the plants of <italic>B</italic>. <italic>glabra</italic> were selected at three different stages, ranging from thorn formation (stage 1) to thorn hardening (stage 2 to stage 3), as shown in <xref ref-type="fig" rid="F1">Figure 1</xref>. We extracted the total RNA from both thorns and stems and constructed transcriptome libraries for each stage using three biological triplicates of samples. We sequenced the libraries using the Illumina platform and obtained raw reads ranging from 41,266,290 to 49987188 from 18 libraries. The base calling accuracy of more than 99.9% (Q30(%)) for each treatment was over 90%, as shown in <xref ref-type="table" rid="T2">Table 2</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Flowering plants of <italic>B</italic>. <italic>glabra</italic> and the three stages of thorn formation used for the study.</p>
</caption>
<graphic xlink:href="fgene-15-1375488-g001.tif"/>
</fig>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>List of data output quality.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Sample</th>
<th align="center">Raw reads</th>
<th align="center">Clean reads</th>
<th align="center">Error (%)</th>
<th align="center">Q20 (%)</th>
<th align="center">Q30 (%)</th>
<th align="center">GC content (%)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">C1_1</td>
<td align="center">46997486</td>
<td align="center">46652954</td>
<td align="center">0.03</td>
<td align="center">97.38</td>
<td align="center">93.08</td>
<td align="center">43.9</td>
</tr>
<tr>
<td align="center">C1_2</td>
<td align="center">49987188</td>
<td align="center">49659918</td>
<td align="center">0.03</td>
<td align="center">97.39</td>
<td align="center">93.05</td>
<td align="center">44.64</td>
</tr>
<tr>
<td align="center">C1_3</td>
<td align="center">47513884</td>
<td align="center">4,7221972</td>
<td align="center">0.03</td>
<td align="center">97.38</td>
<td align="center">93.01</td>
<td align="center">44.68</td>
</tr>
<tr>
<td align="center">C2_1</td>
<td align="center">47716478</td>
<td align="center">47405948</td>
<td align="center">0.03</td>
<td align="center">97.42</td>
<td align="center">93.11</td>
<td align="center">44.56</td>
</tr>
<tr>
<td align="center">C2_2</td>
<td align="center">45417610</td>
<td align="center">45193820</td>
<td align="center">0.03</td>
<td align="center">97.34</td>
<td align="center">92.87</td>
<td align="center">44.71</td>
</tr>
<tr>
<td align="center">C2_3</td>
<td align="center">48635900</td>
<td align="center">48360212</td>
<td align="center">0.03</td>
<td align="center">97.35</td>
<td align="center">92.94</td>
<td align="center">44.71</td>
</tr>
<tr>
<td align="center">C3_1</td>
<td align="center">45717148</td>
<td align="center">45421208</td>
<td align="center">0.03</td>
<td align="center">97.34</td>
<td align="center">92.95</td>
<td align="center">44.4</td>
</tr>
<tr>
<td align="center">C3_2</td>
<td align="center">44137788</td>
<td align="center">43892366</td>
<td align="center">0.03</td>
<td align="center">97.32</td>
<td align="center">92.87</td>
<td align="center">44.4</td>
</tr>
<tr>
<td align="center">C3_3</td>
<td align="center">47237234</td>
<td align="center">46963976</td>
<td align="center">0.03</td>
<td align="center">97.37</td>
<td align="center">92.94</td>
<td align="center">44.29</td>
</tr>
<tr>
<td align="center">J1_1</td>
<td align="center">43726332</td>
<td align="center">43502176</td>
<td align="center">0.03</td>
<td align="center">97.36</td>
<td align="center">92.95</td>
<td align="center">44.53</td>
</tr>
<tr>
<td align="center">J1_2</td>
<td align="center">45084210</td>
<td align="center">44801296</td>
<td align="center">0.03</td>
<td align="center">97.28</td>
<td align="center">92.84</td>
<td align="center">44.65</td>
</tr>
<tr>
<td align="center">J1_3</td>
<td align="center">47441554</td>
<td align="center">47145802</td>
<td align="center">0.03</td>
<td align="center">97.49</td>
<td align="center">93.23</td>
<td align="center">44.58</td>
</tr>
<tr>
<td align="center">J2_1</td>
<td align="center">46457002</td>
<td align="center">46209204</td>
<td align="center">0.03</td>
<td align="center">97.38</td>
<td align="center">92.98</td>
<td align="center">44.39</td>
</tr>
<tr>
<td align="center">J2_2</td>
<td align="center">46184660</td>
<td align="center">45934398</td>
<td align="center">0.03</td>
<td align="center">97.35</td>
<td align="center">92.93</td>
<td align="center">44.46</td>
</tr>
<tr>
<td align="center">J2_3</td>
<td align="center">41,266,290</td>
<td align="center">41059518</td>
<td align="center">0.03</td>
<td align="center">97.46</td>
<td align="center">93.19</td>
<td align="center">44.68</td>
</tr>
<tr>
<td align="center">J3_1</td>
<td align="center">42274290</td>
<td align="center">42065976</td>
<td align="center">0.03</td>
<td align="center">97.56</td>
<td align="center">93.34</td>
<td align="center">44.31</td>
</tr>
<tr>
<td align="center">J3_2</td>
<td align="center">43887862</td>
<td align="center">43646514</td>
<td align="center">0.03</td>
<td align="center">97.56</td>
<td align="center">93.38</td>
<td align="center">44.61</td>
</tr>
<tr>
<td align="center">J3_3</td>
<td align="center">46624754</td>
<td align="center">46386220</td>
<td align="center">0.03</td>
<td align="center">97.42</td>
<td align="center">93.13</td>
<td align="center">44.39</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Samples of thorns at the three stages: C1, stage 1; C2, stage 2; and C3, stage 3, while stems were at J1, stage 1; J2, stage 2; and J3; stage 3 of maturation.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The transcript sequence assembled by Trinity was used as the reference sequence for subsequent analysis. After hierarchical clustering by Corset, the longest cluster sequence was obtained for subsequent analysis. The lengths of transcripts and clustered sequences were counted separately, and the results are shown in <xref ref-type="fig" rid="F2">Figure 2</xref>.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Spliced transcripts and gene sequence length distribution map: <bold>(A)</bold> length distribution; <bold>(B)</bold> unigene length distribution; and <bold>(C)</bold> transcript length distribution.</p>
</caption>
<graphic xlink:href="fgene-15-1375488-g002.tif"/>
</fig>
<p>Gene function was annotated using various databases including NCBI, Pfam, KOG/COG, Swiss-Prot, KEGG Ortholog, and GO. A total of 8,937 genes were co-annotated using these databases (as shown in <xref ref-type="fig" rid="F3">Figure 3A</xref>). The FPKM density distribution reflects the gene expression pattern of each sample as a whole. The graph shows a non-standard normal distribution with an area of 1, indicating that the sum of probabilities is 1. The peak of the density distribution curve represents the highest number of genes at the expression level (<xref ref-type="fig" rid="F3">Figure 3B</xref>). In this experiment, hierarchical clustering analysis was performed using the FPKM values of differential genes under different experimental conditions as expression levels. Genes in the same cluster exhibit similar expression level changes under various treatment conditions. Genes within the same group have similar expression patterns and might participate in the same biological processes or have similar functions. As shown in <xref ref-type="fig" rid="F3">Figure 3C</xref>, the gene expression patterns in stages 2 and 3 are significantly different from those in stage 1, both in thorns and stems. Furthermore, the gene expression patterns are notably different between thorns and stems.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Overview of transcriptome analysis: <bold>(A)</bold> number of genes annotated by each database. <bold>(B)</bold> Comparison chart of gene expression levels in different parts at different periods. <bold>(C)</bold> Cluster analysis of differentially expressed genes. Note: Samples of thorns at the three stages: C1, stage 1; C2, stage 2; and C3, stage 3 while stems were at J1, stage 1; J2, stage 2, and J3, stage 3.</p>
</caption>
<graphic xlink:href="fgene-15-1375488-g003.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>Differentially expressed gene analysis</title>
<p>Compared to the thorn formation stage (stage 1), at the stage of thorns turning hard (stage 2), a total of 1,045 genes were upregulated, and 391 genes were downregulated significantly in thorns (<xref ref-type="fig" rid="F4">Figure 4A</xref>), while 918 genes were upregulated and 784 genes were downregulated markedly in stems (<xref ref-type="fig" rid="F4">Figure 4B</xref>). As the thorns become hard and turn brown (stage 3), a total of 63 genes exhibited a noteworthy increase in expression and 98 genes showed a significant decrease in expression in the thorns (<xref ref-type="fig" rid="F4">Figure 4A</xref>), while 46 genes showed a significant upregulation in expression and 29 genes showed downregulation within the stems, compared with the stage 2 (<xref ref-type="fig" rid="F4">Figure 4B</xref>). The results indicate that stage 2 is the most active period of gene expression during the hardening process of <italic>B</italic>. <italic>glabra</italic> thorns.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Differences in gene expression at three stages. <bold>(A)</bold> Gene expression of thorns. <bold>(B)</bold> Gene expression of stems. Note: Samples of thorns at the three stages- C1- stage 1; C2- stage 2 and C3- stage 3 while stems were at J1- stage 1; J2- stage 2 and J3- stage 3.</p>
</caption>
<graphic xlink:href="fgene-15-1375488-g004.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>GO enrichment analysis</title>
<p>Active gene expression means vigorous biosynthesis and metabolism in the organism. According to GO enrichment analysis, at the stage of thorns turning hard, the three most gene-enriched biological processes in thorns (C2) were single-organism metabolism, carbohydrate metabolism, and the oxidation&#x2013;reduction process, compared with the early stage of thorn formation (C1). At the same time, the molecular function exhibiting the highest degree of gene enrichment was catalytic activity (<xref ref-type="fig" rid="F5">Figure 5A</xref>). The gene enrichment in stem samples was generally consistent with that observed in thorn samples (<xref ref-type="fig" rid="F5">Figure 5B</xref>). Comparing the gene enrichment analysis at stage 3 with stage 2 of thorns (C3 VS C2), the bioprocess of metabolism was the most enriched, while the molecular function of oxidoreductase activity was enhanced as the top activity. The number of genes enriched in these biological processes decreased significantly when the thorns entered 2&#x2013;3 stage. However, the biological processes in which genes are mainly enriched are still the same three processes&#x2014;the single organism metabolism process, carbohydrate metabolism process, and oxidation&#x2013;reduction process (<xref ref-type="fig" rid="F5">Figure 5C</xref>). The situation of gene enrichment in the thorn (J3 VS J2) samples was comparable to what was noted in the stem samples (<xref ref-type="fig" rid="F5">Figure 5D</xref>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>GO gene enrichment analysis shown for stages of thorn and stem maturation: <bold>(A)</bold> C2 vs. C1. <bold>(B)</bold> J2 vs. J1. <bold>(C)</bold> C3 vs. C2. <bold>(D)</bold> J3 vs. J2.</p>
</caption>
<graphic xlink:href="fgene-15-1375488-g005.tif"/>
</fig>
<p>A directed acyclic graph (DAG) was drawn based on the results of differential gene GO enrichment analysis. Further comprehensive analysis of the biological process from stage 1 to stage 3 shows that the synthesis of cellulose is significantly enriched in this process (<xref ref-type="fig" rid="F6">Figure 6</xref>). It is found that genes related to cellulose synthesis are significantly enriched in thorns during this process, whereas genes related to cellulose degradation and synthesis are significantly enriched in the stems. We speculate that degraded cellulose in the stem may be transported to the thorns and participate in their hardening process.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Differential gene GO enrichment DAG plot (partial view). <bold>(A)</bold> C3 VS C1. <bold>(B)</bold> J3 VS J1.</p>
</caption>
<graphic xlink:href="fgene-15-1375488-g006.tif"/>
</fig>
</sec>
<sec id="s3-4">
<title>KEGG enrichment and RT-qPCR analysis and determination of lignin</title>
<p>Through KEGG enrichment analysis, we found that phenylpropanoid biosynthesis was a key step in the hardening process of the thorns of <italic>B</italic>. <italic>glabra</italic>. From stage 1 to stage 3, in thorns, the most significantly enriched pathway was the phenylpropanoid biosynthesis (<xref ref-type="fig" rid="F7">Figure 7</xref>; <xref ref-type="sec" rid="s11">Supplementary Tables S2&#x2013;5</xref>). From stage 1 to stage 2, many genes in phenylpropanoid biosynthesis were upregulated remarkably in thorns (<xref ref-type="fig" rid="F8">Figure 8</xref>). The above results were also verified by RT-qPCR of the important enzymes of the pathway. It indicates that <italic>PAL</italic> (EC:4.3.1.24, K10775, phenylalanine ammonia-lyase) (<xref ref-type="fig" rid="F9">Figure 9A</xref>), <italic>CYP73A</italic> (EC:1.14.14.91, K00487, trans-cinnamate 4-monooxygenase) (<xref ref-type="fig" rid="F9">Figure 9B</xref>), <italic>4CL</italic> (EC:6.2.1.12, K01904, 4-coumarate-CoA ligase) (<xref ref-type="fig" rid="F9">Figure 9C</xref>), <italic>CCR</italic> (EC:1.2.1.44, K09753, cinnamoyl-CoA reductase) (<xref ref-type="fig" rid="F9">Figure 9D</xref>), <italic>CAD</italic> (EC:1.1.1.195, K00083, cinnamyl-alcohol dehydrogenase) (<xref ref-type="fig" rid="F9">Figure 9E</xref>), and <italic>POX</italic> (EC:1.11.1.7, K00430) (<xref ref-type="fig" rid="F9">Figure 9F</xref>) were the key genes for the phenylpropanoid biosynthesis pathway, leading to the structural component of plant secondary cell walls and lignin biosynthesis. The expression levels of these genes exhibited a notable upregulation during the second stage compared with the first stage. The phenylpropanoid biosynthesis is the key step of lignin biosynthesis. The determination of the lignin content in thorns and stems at three stages (<xref ref-type="fig" rid="F9">Figure 9G</xref>) also agreed with the results of transcriptome analysis and RT-qPCR. To sum up, phenylpropanoid biosynthesis is a key step in the hardening process of the thorns of <italic>B</italic>. <italic>glabra</italic> as it was upregulated during maturation with maximum gene expression of the key enzymes during stage 2 of maturation.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>KEGG gene enrichment analysis in thorns and stems: <bold>(A)</bold> KEGG gene enrichment analysis in thorns from stage 1 to stage 2. <bold>(B)</bold> KEGG gene enrichment analysis in thorns from stage 2 to stage 3. <bold>(C)</bold> KEGG gene enrichment analysis in stems from stage 1 to stage 2. <bold>(D)</bold> KEGG gene enrichment analysis in stems from stage 2 to stage 3.</p>
</caption>
<graphic xlink:href="fgene-15-1375488-g007.tif"/>
</fig>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Upregulated genes in phenylpropanoid biosynthesis (C2 VS C1) (Ref: 231673).</p>
</caption>
<graphic xlink:href="fgene-15-1375488-g008.tif"/>
</fig>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Expression profiles of genes using RT-qPCR in the thorns [C1, C2, and C3] and stems [J1, J2, and J3] at three stages of maturation. <bold>(A)</bold> The genes assayed were <italic>PAL</italic> <bold>(B)</bold>, <italic>CYP37A</italic> <bold>(C)</bold>, <italic>4CL</italic> <bold>(D)</bold>, <italic>CCR</italic> <bold>(E)</bold>, <italic>CAD</italic> <bold>(F)</bold>, and <italic>POX</italic>. <bold>(G)</bold> Lignin content in the thorns [C1, C2, and C3] and stems [J1, J2, and J3] at three stages of maturation.</p>
</caption>
<graphic xlink:href="fgene-15-1375488-g009.tif"/>
</fig>
</sec>
<sec id="s3-5">
<title>Transcription factors in transcriptomes and correlation analysis with lignin biosynthesis</title>
<p>From the first stage to the third stage of thorn formation, 2,395 TFs were completely identified in thorns. They included MYB, AP2-EREBP, orphans, C3H, HB, bHLH, WRKY, NAC, C2H2, and bZIP (<xref ref-type="fig" rid="F10">Figure 10A</xref>). In stems, 2,444 TFs were completely identified. They included similar types of TFs as thorns, differing only in the percentage of TFs in each class from thorns (<xref ref-type="fig" rid="F10">Figure 10B</xref>). From the first stage to the second stage of the thorn formation, 39 genes were significantly altered in the phenylpropanoid biosynthesis pathway in thorns (<xref ref-type="sec" rid="s11">Supplementary Table S2</xref>). By correlation analysis, there were many TFs with correlation coefficients greater than 0.8 with these genes. These TFs MYB and HB are the most numerous (<xref ref-type="fig" rid="F10">Figure 10C</xref>).</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>Statistical map of transcription factors with significant differences in different tissues <bold>(A)</bold> Transcription factors with significant differential expression in thorns from the first stage to the third stage. <bold>(B)</bold> Transcription factors with significant differential expression in stems from the first stage to the third stage. <bold>(C)</bold> The top 10&#xa0;TFs correlated with phenylpropanoid synthesis.</p>
</caption>
<graphic xlink:href="fgene-15-1375488-g010.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>In the process of thorns&#x2019; hardening, the synthesis of cellulose is significantly enriched by GO analysis, and the phenylpropanoid biosynthesis is enriched by KEGG analysis (<xref ref-type="fig" rid="F8">Figure 8</xref>). Both the synthesis of cellulose (<xref ref-type="fig" rid="F6">Figure 6</xref>) and lignin (<xref ref-type="fig" rid="F9">Figure 9</xref>) are highly related to the secondary cell wall development, which is supposed to be the important process of thorns&#x2019; hardening.</p>
<p>From stage 1 to stage 3, a continuous accumulation of lignin in thorns of <italic>B</italic>. <italic>glabra</italic> was observed.</p>
<p>Lignin constitutes a polymer resulting from the intricate polymerization of distinct lignin monomers. The process of lignin biosynthesis is orchestrated through the integration of the phenylalanine metabolic pathway and the dedicated lignin-specific pathway. The synthesis of lignin from phenylalanine can be divided into four steps. First, phenylalanine forms p-coumaric acid under the catalysis of phenylalanine ammonia-lyase (<italic>PAL</italic>) and cinnamic acid 4-hydroxylase (<italic>C4H</italic>). Next, p-coumaric acid forms caffeic acid under the catalysis of p-coumarate 3-hydroxylase (<italic>C3H</italic>), caffeic acid forms ferulic acid under the catalysis of caffeic acid O-methyltransferase (<italic>COMT</italic>), and ferulic acid forms 5-hydroxy-ferulic acid under the catalysis of ferulate-5-hydroxylase (<italic>F5H</italic>) and then forms sinapic acid by the catalysis of caffeic acid O-methyltransferase. Subsequently, the phenolic acids previously elucidated undergo catalytic transformation facilitated by a sequence of enzymes. Commencing with 4-coumarate CoA ligase (<italic>4CL</italic>), the process advances through cinnamoyl-CoA reductase (<italic>CCR</italic>) and culminates in cinnamyl alcohol dehydrogenase/sinapyl alcohol dehydrogenase (<italic>CAD</italic>/<italic>SAD</italic>)-mediated reactions. These orchestrated enzymatic steps culminate in the synthesis of distinctive compounds, namely, p-coumaryl alcohol, caffeoyl alcohol, coniferyl alcohol, 5-hydroxy-coniferyl alcohol, and sinapyl alcohol. Ultimately, the trimeric units of lignin&#x2014;namely, p-coumaryl alcohol, coniferyl alcohol, and sinapyl alcohol&#x2014;underwent a process of polymerization catalyzed by peroxidase (<italic>POD</italic>/<italic>PER</italic>/<italic>PRX</italic>) or laccase (<italic>LAC</italic>). This orchestrated transformation yielded three distinct high-molecular weight lignin polymers: p-hydroxyphenyl lignin, guaiacyl lignin, and syringyl lignin (<xref ref-type="bibr" rid="B17">Yoon et al., 2015</xref>). From the formation to hardening of thorns on the stems of <italic>B</italic>. <italic>glabra</italic>, the genes encoded <italic>PAL</italic>, <italic>CCR</italic>, <italic>4CL</italic>, <italic>CAD</italic>, and <italic>POX</italic> are upregulated during this process. At the same time, lignin gradually accumulated in thorns and stems. It was confirmed that the hardening process of the thorns on stems of <italic>B</italic>. <italic>glabra</italic> depended on the lignin accumulation. The lignin accumulation in the thorns of <italic>B</italic>. <italic>glabra</italic> relied on the phenylpropanoid biosynthesis pathway.</p>
<p>TFs play a crucial role in the regulation of gene expression. By binding to specific DNA sequences in the promoter regions of target genes, TFs activate or repress the transcription of those genes to achieve the control of genes expression in a coordinated and regulated manner (<xref ref-type="bibr" rid="B18">Yusuf et al., 2012</xref>). TFs are essential for the normal development and functioning of plants. For example, a class of TFs, NACs, which play important roles in regulating plant growth and development, are involved in secondary cell wall development, seed germination, root development, leaf senescence, floral organ formation, and fruit ripening, as well as mediating plant responses to low temperature, high temperature, drought, flooding, high salt, and disease (<xref ref-type="bibr" rid="B6">Han et al., 2023</xref>).</p>
<p>When it comes to the regulation of lignin synthesis, current research mainly focuses on two types of TFs, NAC and MYB (<xref ref-type="fig" rid="F10">Figure 10</xref>). In <italic>Arabidopsis thaliana</italic>, a three-level regulatory network composed of NAC and MYB jointly regulates the synthesis of lignin, cellulose, and hemicellulose during secondary cell wall thickening in <italic>A</italic>. <italic>thaliana</italic> (<xref ref-type="bibr" rid="B12">Nakano et al., 2015</xref>). In addition to NAC and MYB TFs, lignin synthesis was also regulated by WRKY, bHLH, LBD, LIM, and microRNA, etc. (<xref ref-type="bibr" rid="B3">Behr et al., 2019</xref>). Based on the transcriptome analysis of the three stages, we can further screen the regulatory factors that regulate the accumulation of lignin in thorns, to provide a more scientific basis for the cultivation of soft thorns or thorn-free <italic>B</italic>. <italic>glabra</italic>. In the other study, the content of soluble sugar and starch was measured during the growth and development of the thorn, and transcriptome sequencing of the thorn segment, non-thorn segment, apex, and root tip was performed at five distinct stages of thorn formation. The findings indicate that as <italic>Gleditsia sinensis</italic> underwent maturation, there was a discernible pattern in the soluble sugar content across various plant components, including roots, hypocotyls, thorn stems, thornless stems, and leaves. Additionally, the starch content in roots and leaves exhibited an initial increase, followed by a subsequent decline upon the establishment of the fundamental thorn structure. Notably, the overall trajectory of both soluble sugar and starch content in <italic>G</italic>. <italic>sinensis</italic> demonstrated a consistent decrease, amounting to a reduction of 59.26% and 84.56%, respectively. Genes such as MYB-like, YABBY2, growth-regulating factor 3 (GRF3), TCP2, zinc transporter 8, and additional 25 genes are posited to be associated with the regulation and promotion of thorn maintenance and growth. The GO enrichment analysis conducted on DEGs between stems exhibiting thorns and those without revealed a notable enrichment of DEGs associated with biological processes indicative of positive regulation of development, specifically in the context of heterochronic events (GO:0045962) and the positive modulation of photomorphogenesis (GO:2000306), among other relevant biological process terms. This observation suggests a correlation between the regulation of developmental initiation in <italic>G</italic>. <italic>sinensis</italic> and the involvement of TCP TFs (<xref ref-type="bibr" rid="B15">Xiao et al., 2023</xref>). In our study, we focused on the lignin accumulation relied on the phenylpropanoid biosynthesis pathway. It is believed that lignin accumulation was the key step to forming the thorns. Until now, we cannot find any varieties of <italic>B</italic>. <italic>glabra</italic> that have no thorns. The above studies give us some insights for future studies where we can focus on TFs that act on the phenylalanine metabolic pathway. Lignin accumulation was reduced in thorns using RNA interference and other means, with a view to breeding varieties with soft thorns. Furthermore, if the lignin transport from stems to thorns could be blocked, it might be possible to produce thornless varieties of <italic>B</italic>. <italic>glabra</italic>.</p>
</sec>
<sec sec-type="conclusion" id="s5">
<title>Conclusion</title>
<p>The process of thorn formation and hardening on the stem of <italic>B</italic>. <italic>glabra</italic> involves the gradual accumulation of lignin in the thorns. Several genes are involved in this process, including <italic>PAL</italic> (phenylalanine ammonia-lyase), <italic>CYP73A</italic> (trans-cinnamate 4-monooxygenase), <italic>4CL</italic> (reductase4-coumarate-CoA ligase), <italic>CCR</italic> (cinnamoyl-CoA reductase), <italic>CAD</italic> (cinnamyl-alcohol dehydrogenase), and <italic>POX</italic> (peroxidase). These genes play a crucial role in lignin synthesis and accumulation, which occurs through the phenylpropanoid biosynthesis pathways.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found at: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/genbank/,%20PRJNA1015025">https://www.ncbi.nlm.nih.gov/genbank/, PRJNA1015025</ext-link>.</p>
</sec>
<sec id="s7">
<title>Author contributions</title>
<p>LS: funding acquisition, resources, writing&#x2013;original draft, and writing&#x2013;review and editing. HW: investigation and writing&#x2013;review and editing. JL: investigation, resources, and writing&#x2013;review and editing. JG: methodology, resources, and writing&#x2013;review and editing. SY: methodology, software, and writing&#x2013;review and editing. KY: investigation and writing&#x2013;review and editing. EC: methodology and writing&#x2013;review and editing. BL: methodology, resources, and writing&#x2013;review and editing. ZL: data curation and writing&#x2013;review and editing. QC: data curation, formal analysis, and writing&#x2013;review and editing. ML: project administration, supervision, and writing&#x2013;review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s8">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. The Natural Science Foundation of Guangxi Science and Technology Department (Project No. 2020GXNSFAA297064), the Guangxi Forestry Science and Technology Promotion Demonstration Project (Contract No. Guilin Scientific Research (2022) No. 11), and the Guangxi Forestry Science and Technology Promotion Demonstration Project (Contract No. 2023GXLK29) funded the study.</p>
</sec>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of interest</title>
<p>Author QC was employed by Nanning GoldTech Biotechnology Ltd.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors, and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2024.1375488/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2024.1375488/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material>
<label>SUPPLEMENTARY TABLE S1</label>
<caption>
<p>Primers used in RT-qPCR.</p>
</caption>
</supplementary-material>
<supplementary-material>
<label>SUPPLEMENTARY TABLE S2</label>
<caption>
<p>KEGG-enriched pathways: top 10 (C2 VS C1).</p>
</caption>
</supplementary-material>
<supplementary-material>
<label>SUPPLEMENTARY TABLE S3</label>
<caption>
<p>KEGG-enriched pathways: top 10 (C3 VS C2).</p>
</caption>
</supplementary-material>
<supplementary-material>
<label>SUPPLEMENTARY TABLE S4</label>
<caption>
<p>KEGG-enriched pathways: top 10 (J2 VS J1).</p>
</caption>
</supplementary-material>
<supplementary-material>
<label>SUPPLEMENTARY TABLE S5</label>
<caption>
<p>KEGG-enriched pathways: top 10 (J3 VS J2).</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Table1.pdf" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Antonova</surname>
<given-names>G. F.</given-names>
</name>
<name>
<surname>Varaksina</surname>
<given-names>T. N.</given-names>
</name>
<name>
<surname>Zheleznichenko</surname>
<given-names>T. V.</given-names>
</name>
<name>
<surname>Stasova</surname>
<given-names>V. V.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Lignin deposition during earlywood and latewood formation in Scots pine stems</article-title>. <source>Wood Sci. Technol.</source> <volume>48</volume>, <fpage>919</fpage>&#x2013;<lpage>936</lpage>. <pub-id pub-id-type="doi">10.1007/s00226-014-0650-3</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bautista</surname>
<given-names>M. a. C.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Boufford</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Phylogeny and taxonomic synopsis of the genus Bougainvillea (Nyctaginaceae)</article-title>. <source>Plants</source> <volume>11</volume>, <fpage>1700</fpage>. <pub-id pub-id-type="doi">10.3390/plants11131700</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Behr</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Guerriero</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Grima-Pettenati</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Baucher</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A molecular blueprint of lignin repression</article-title>. <source>Trends Plant Sci.</source> <volume>24</volume>, <fpage>1052</fpage>&#x2013;<lpage>1064</lpage>. <pub-id pub-id-type="doi">10.1016/j.tplants.2019.07.006</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davidson</surname>
<given-names>N. M.</given-names>
</name>
<name>
<surname>Oshlack</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Corset: enabling differential gene expression analysis for <italic>de novo</italic> assembled transcriptomes</article-title>. <source>Genome Biol.</source> <volume>15</volume>, <fpage>410</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-014-0410-6</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grabherr</surname>
<given-names>M. G.</given-names>
</name>
<name>
<surname>Haas</surname>
<given-names>B. J.</given-names>
</name>
<name>
<surname>Yassour</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Levin</surname>
<given-names>J. Z.</given-names>
</name>
<name>
<surname>Thompson</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Amit</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Full-length transcriptome assembly from RNA-Seq data without a reference genome</article-title>. <source>Nat. Biotechnol.</source> <volume>29</volume>, <fpage>644</fpage>&#x2013;<lpage>652</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1883</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>NACs, generalist in plant life</article-title>. <source>Plant Biotechnol. J.</source> <volume>21</volume>, <fpage>2433</fpage>&#x2013;<lpage>2457</lpage>. <pub-id pub-id-type="doi">10.1111/pbi.14161</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kanehisa</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Toward understanding the origin and evolution of cellular organisms</article-title>. <source>Protein Sci.</source> <volume>28</volume>, <fpage>1947</fpage>&#x2013;<lpage>1951</lpage>. <pub-id pub-id-type="doi">10.1002/pro.3715</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kanehisa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Goto</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>KEGG: kyoto encyclopedia of genes and genomes</article-title>. <source>Nucleic Acids Res.</source> <volume>28</volume>, <fpage>27</fpage>&#x2013;<lpage>30</lpage>. <pub-id pub-id-type="doi">10.1093/nar/28.1.27</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kushwah</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Banasiak</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nishikubo</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Derba-Maceluch</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Majda</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Endo</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Arabidopsis XTH4 and XTH9 contribute to wood cell expansion and secondary wall formation</article-title>. <source>Plant Physiol.</source> <volume>182</volume>, <fpage>1946</fpage>&#x2013;<lpage>1965</lpage>. <pub-id pub-id-type="doi">10.1104/pp.19.01529</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Dewey</surname>
<given-names>C. N.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>RSEM: accurate transcript quantification from RNA-Seq data with or without a reference genome</article-title>. <source>BMC Bioinforma.</source> <volume>12</volume>, <fpage>323</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-12-323</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lim</surname>
<given-names>T. K.</given-names>
</name>
</person-group> (<year>2014</year>). &#x201c;<article-title>Bougainvillea glabra</article-title>,&#x201d; in, <source>Edible Medicinal And Non Medicinal Plants</source> (<publisher-loc>Dordrecht, Netherlands</publisher-loc>: <publisher-name>Springer Netherlands</publisher-name>), <comment>Flowers</comment>, <volume>Vol. 8</volume>, <fpage>483</fpage>&#x2013;<lpage>488</lpage>. <pub-id pub-id-type="doi">10.1007/978-94-017-8748-2_33</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nakano</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yamaguchi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Endo</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Rejab</surname>
<given-names>N. A.</given-names>
</name>
<name>
<surname>Ohtani</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>NAC-MYB-based transcriptional regulation of secondary cell wall biosynthesis in land plants</article-title>. <source>Front. Plant Sci.</source> <volume>6</volume>, <fpage>288</fpage>, <pub-id pub-id-type="doi">10.3389/fpls.2015.00288</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun Lina</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Jinhua</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Dingjian</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Comprehensive evaluation on ornamental value of 30 species of <italic>Bougainvillea glabra</italic> in Guangxi</article-title>. <source>Agric. Res. Appl.</source> <volume>6</volume>, <fpage>1</fpage>&#x2013;<lpage>6</lpage>.</citation>
</ref>
<ref id="B14">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Z. Y.</given-names>
</name>
<name>
<surname>Raven</surname>
<given-names>P. H.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>D. Y.</given-names>
</name>
</person-group> (<year>2003</year>). <source>Flora of China</source>. <publisher-loc>Beijing, China</publisher-loc>: <publisher-name>Science Press</publisher-name>.</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiao</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Comparative transcriptome analysis of Gleditsia sinensis thorns at different stages of development</article-title>. <source>Plants</source> <volume>12</volume>, <fpage>1456</fpage>. <pub-id pub-id-type="doi">10.3390/plants12071456</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Yanjing</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2010</year>). <source>ISSR analysis of germplasm resources of Bongainvillea Brasiliensis Raeusch. Master</source>. <publisher-loc>Fuzhou, China</publisher-loc>: <publisher-name>Fujian Agriculture and Forestry University</publisher-name>.</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yoon</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>An</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Roles of lignin biosynthesis and regulatory genes in plant development</article-title>. <source>J. Integr. Plant Biol.</source> <volume>57</volume>, <fpage>902</fpage>&#x2013;<lpage>912</lpage>. <pub-id pub-id-type="doi">10.1111/jipb.12422</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yusuf</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Butland</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Swanson</surname>
<given-names>M. I.</given-names>
</name>
<name>
<surname>Bolotin</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ticoll</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cheung</surname>
<given-names>W. A.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>The transcription factor encyclopedia</article-title>. <source>Genome Biol.</source> <volume>13</volume>, <fpage>R24</fpage>. <pub-id pub-id-type="doi">10.1186/gb-2012-13-3-r24</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>