<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2026.1767538</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Influences of organic nitrogen application ratio on oil content in flue-cured tobacco based on field experiments and a random forest model</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Sun</surname><given-names>Zijun</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3121980/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Jiang</surname><given-names>Wanhui</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3121775/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname><given-names>Huaiyuan</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Liang</surname><given-names>Yaoxing</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname><given-names>Xin</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Peng</surname><given-names>Chen</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Shao</surname><given-names>Lanjun</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname><given-names>Qihang</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Fu</surname><given-names>Jijiao</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Chen</surname><given-names>Jianjun</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Deng</surname><given-names>Shiyuan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>College of Agriculture, South China Agricultural University</institution>, <city>Guangzhou</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>Center for Basic Experiments and Practical Training, South China Agricultural University</institution>, <city>Guangzhou</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff3"><label>3</label><institution>China Tobacco Guangdong Industrial Co., Ltd.</institution>, <city>Guangzhou</city>,&#xa0;<country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Jianjun Chen, <email xlink:href="mailto:chenjianjun@scau.edu.cn">chenjianjun@scau.edu.cn</email>; Shiyuan Deng, <email xlink:href="mailto:yydsy@scau.edu.cn">yydsy@scau.edu.cn</email></corresp>
<fn fn-type="equal" id="fn003">
<label>&#x2020;</label>
<p>These authors have contributed equally to this work and share first authorship</p></fn>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-02">
<day>02</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>17</volume>
<elocation-id>1767538</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>11</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>06</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Sun, Jiang, Li, Liang, Yang, Peng, Shao, Yang, Fu, Chen and Deng.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Sun, Jiang, Li, Liang, Yang, Peng, Shao, Yang, Fu, Chen and Deng</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-02">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Tobacco is a key economic crop, with leaf oil content serving as a critical determinant of leaf quality. To address the limited understanding of mechanisms underlying oil content improvement and the decline in flue-cured tobacco quality caused by long-term reliance on chemical fertilizers, this study integrated field experiments with a machine learning approach. Five treatments with varying organic nitrogen ratios (0%, 10%, 20%, 30%, and 40%) were evaluated at a single experimental site in Hengyang, Hunan. Results indicated that a 30% organic nitrogen ratio significantly enhanced the activity of key lipid metabolism enzymes, promoted the accumulation of lipid metabolites (including cembratriene-diol and sucrose esters), increased glandular trichome density, and improved leaf physical properties such as softness, tensile strength, and thickness, ultimately achieving the highest oil content. Using a robust data augmentation strategy and Recursive Feature Elimination, a Random Forest model was constructed to dissect the complex regulatory network. The model achieved a high predictive accuracy (CV R&#xb2; = 0.819) on the augmented dataset, significantly outperforming the model based on original small-sample data. Feature importance analysis identified petroleum ether extract, cembratriene-diol, leaf softness, reducing sugar, and glandular trichome density as the primary predictors. Significant interactions among these features were also revealed by SHAP dependence plots. These findings provide a theoretical basis for optimizing organic nitrogen application to enhance tobacco leaf oil content and quality in agricultural production.</p>
</abstract>
<kwd-group>
<kwd>flue-cured tobacco</kwd>
<kwd>glandular trichome development</kwd>
<kwd>lipid metabolism</kwd>
<kwd>oil content</kwd>
<kwd>organic nitrogen ratio</kwd>
<kwd>random forest model</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This study was supported by Science and Technology Program of China Tobacco Guangdong Industrial Co., Ltd.(2023440000340020; 2024440000340017).</funding-statement>
</funding-group>
<counts>
<fig-count count="10"/>
<table-count count="3"/>
<equation-count count="4"/>
<ref-count count="45"/>
<page-count count="15"/>
<word-count count="8144"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Crop and Product Physiology</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Flue-cured tobacco is one of the most important economic crops, with China&#x2019;s cultivation area ranking first worldwide (<xref ref-type="bibr" rid="B27">Poltronieri, 2006</xref>; <xref ref-type="bibr" rid="B9">Chen et&#xa0;al., 2019</xref>). Fertilization plays a pivotal role in determining yield and quality (<xref ref-type="bibr" rid="B3">Bender et&#xa0;al., 2023</xref>), yet excessive or imbalanced application can degrade soil resources, waste inputs, and disrupt leaf chemistry (<xref ref-type="bibr" rid="B40">Yan et&#xa0;al., 2025</xref>). The long-term, sole use of chemical fertilizers has become widespread in flue-cured tobacco production, but it reduces soil fertility and deteriorates soil physical and chemical properties, undermining the conditions necessary for producing high-quality tobacco leaves (<xref ref-type="bibr" rid="B17">Gruber and Galloway, 2008</xref>).</p>
<p>Organic fertilizers, sourced from organic waste, supply abundant organic matter and micronutrients while improving soil structure, water retention, fertility, and aeration (<xref ref-type="bibr" rid="B23">Lu et&#xa0;al., 2024</xref>; <xref ref-type="bibr" rid="B31">Shang et&#xa0;al., 2020</xref>). However, their sole application is constrained by slow nutrient release and higher costs (<xref ref-type="bibr" rid="B37">Wang et&#xa0;al., 2020</xref>). Consequently, combining organic and inorganic fertilizers has emerged as a key strategy in sustainable flue-cured tobacco cultivation (<xref ref-type="bibr" rid="B25">Paramesh et&#xa0;al., 2023</xref>).</p>
<p>Nitrogen, an essential macronutrient, is frequently the most limiting factor for plant growth and yield (<xref ref-type="bibr" rid="B45">Zhou et&#xa0;al., 2023</xref>). Overuse of inorganic nitrogen not only wastes resources but also contributes to environmental degradation (<xref ref-type="bibr" rid="B32">Shi et&#xa0;al., 2023</xref>). Optimizing the ratio of organic to inorganic nitrogen can mitigate these issues, improving yield and quality while balancing internal chemical composition (<xref ref-type="bibr" rid="B12">Dinesh et&#xa0;al., 2024</xref>; <xref ref-type="bibr" rid="B41">Yang et&#xa0;al., 2023</xref>). Appropriate organic nitrogen supplementation can promote protein synthesis and enhance oil accumulation, directly contributing to the desirable oiliness of the final cured leaves (<xref ref-type="bibr" rid="B28">Qiu et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B43">Zhang et&#xa0;al., 2021</xref>).</p>
<p>In flue-cured tobacco grading, &#x201c;oil content&#x201d; (sensory score) is a composite, sensory-driven metric reflecting the leaf&#x2019;s surface appearance, texture, and aroma (<xref ref-type="bibr" rid="B16">Gao et&#xa0;al., 2025</xref>). It is subjectively evaluated by experts based on visual and tactile cues. In contrast, Petroleum Ether Extract (PEE) represents the chemical fraction of lipids and other non-polar compounds extracted from the leaf, serving as a quantitative proxy for total lipid content. These characteristics are intricately linked to a network of physical and chemical properties. For instance, increased glandular trichome density elevates the levels of cembratriene-diol (CBT-diol) and sucrose esters (<xref ref-type="bibr" rid="B26">Philippe et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B29">Qu et&#xa0;al., 2018</xref>). As primary constituents of PEE, these metabolites constitute the material basis for the leaf&#x2019;s oily appearance and aroma, thereby influencing the sensory evaluation. Biochemically, the accumulation of these lipid compounds is governed by key enzymes that dictate metabolic flux. Fatty acid synthase (FAS) is central to <italic>de novo</italic> fatty acid synthesis, directly promoting fatty acid accumulation (<xref ref-type="bibr" rid="B10">Chen et&#xa0;al., 2025</xref>). Phosphoenolpyruvate carboxylase (PEPC), a key enzyme in carbon fixation, supplies precursors for amino acid and organic acid synthesis, thereby influencing overall metabolic flux and strengthening carbon-nitrogen synergy, which in turn promotes the accumulation of total and reducing sugars (<xref ref-type="bibr" rid="B13">Fan et&#xa0;al., 2013</xref>). Furthermore, phosphatidic acid phosphatase (PAP) is critical for lipid metabolism and phospholipid regulation, with its catalyzed reactions being crucial steps for triacylglycerol synthesis and storage (<xref ref-type="bibr" rid="B8">Carman and Han, 2009</xref>, <xref ref-type="bibr" rid="B7">Carman and Han, 2006</xref>). The collective activity of these enzymes influences the levels of pyruvic acid (PA), total phenols (TP), and other sugars, indirectly shaping the final lipid composition and sensory profile of cured leaves. However, the strong interdependence of these structural and biochemical indicators often causes severe multicollinearity, complicating efforts to isolate each factor&#x2019;s true contribution using conventional statistical approaches.</p>
<p>To address these challenges and elucidate the underlying mechanisms, this study employs a Random Forest (RF) model, which effectively captures non-linear relationships, variable interactions, and high-dimensional dependencies while remaining robust to noise and overfitting (<xref ref-type="bibr" rid="B34">Swamy et&#xa0;al., 2025</xref>). As a non-parametric method, RF builds an ensemble of Classification and Regression Trees (CART) (<xref ref-type="bibr" rid="B30">Seifert et&#xa0;al., 2020</xref>). These capabilities have led to its wide adoption in diverse disciplines, such as ecological prediction and expression-based interpretation (<xref ref-type="bibr" rid="B39">Xavier and Wilfried, 2009</xref>; <xref ref-type="bibr" rid="B5">Bureau et&#xa0;al., 2005</xref>). RF is a powerful ensemble learning method capable of handling non-linear relationships and high-dimensional interactions (<xref ref-type="bibr" rid="B18">He et&#xa0;al., 2024</xref>), making it ideal for dissecting complex agronomic traits. To enhance interpretability, we combined RF with feature attribution and visualization tools, including Mean Decrease in Impurity (MDI) for feature importance, Partial Dependence Plots (PDP), and SHAP (SHapley Additive exPlanations) value analysis. This multifaceted approach aims to yield a transparent and interpretable model (<xref ref-type="bibr" rid="B4">Bouni et&#xa0;al., 2024</xref>; <xref ref-type="bibr" rid="B2">B&#xe9;nard et&#xa0;al., 2022</xref>), enabling both global and local insights into how key physicochemical indicators regulate oil content and reveals complex interactions among them.</p>
<p>This study aims to (1) elucidate the mechanisms by which organic nitrogen ratios influence the oil content of flue-cured tobacco through key physicochemical pathways, (2) identify the optimal organic nitrogen ratio for maximizing oil content, and (3) establish a data-driven framework for more precise evaluation and management of tobacco leaf quality in agricultural production. Here, we show that a 30% organic nitrogen ratio achieves the highest oil content by optimizing a suite of interconnected physicochemical traits. Using an optimized RF model on augmented data, we identified PEE, CBT-diol, and leaf softness as the most influential predictors. Our results further reveal that this optimal nitrogen ratio promotes oil content by stimulating lipid metabolism and glandular trichome development, establishing a clear, data-driven connection between fertilization strategy and final leaf quality.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Experimental materials and site description</title>
<p>The field experiment was conducted from March to July 2024 in Hexi Village, Guanshi Town, Hengnan County, Hengyang City, Hunan Province, China (26&#xb0;43&#x2032;12&#x2033;N, 112&#xb0;50&#x2032;55&#x2033;E; altitude 70 m), The region has a subtropical monsoon climate, with an average temperature of approximately 24 &#xb0;C and precipitation of 800 mm during the tobacco growing season (March-July). The flue-cured tobacco variety used in this study was &#x2018;Yunyan 87&#x2019;. The site, previously cultivated with rice, had the following basic soil properties: pH 7.46, total nitrogen 2.47 g&#xb7;kg<sup>-</sup>&#xb9;, total potassium 1.69 g&#xb7;kg<sup>-</sup>&#xb9;, total phosphorus 0.95 g&#xb7;kg<sup>-</sup>&#xb9;, alkali-hydrolyzable nitrogen 90.44 mg&#xb7;kg<sup>-</sup>&#xb9;, available potassium 379.90 mg&#xb7;kg<sup>-</sup>&#xb9;, available phosphorus 49.63 mg&#xb7;kg<sup>-</sup>&#xb9;, and organic matter 43.16 g&#xb7;kg<sup>-</sup>&#xb9;.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Experimental design</title>
<p>The experiment was arranged in a randomized complete block design with three replicates. Under a constant total N application rate (165 kg&#xb7;N&#xb7;ha<sup>-</sup>&#xb9;), five treatments with varying proportions of organic N were established: ON0 (0% organic N), ON10 (10%), ON20 (20%), ON30 (30%), and ON40 (40%), totaling 15 plots. Guard rows were established around the experimental area, and the planting density was maintained at 17,250 plants ha<sup>-</sup>&#xb9;. The fertilizers used included a specialized basal fertilizer for tobacco (8% N, 10% P<sub>2</sub>O<sub>5</sub>, 11% K<sub>2</sub>O), a starter fertilizer (20% N, 9% P<sub>2</sub>O<sub>5</sub>), a specialized topdressing fertilizer for tobacco (10% N, 32% K<sub>2</sub>O), potassium sulfate (52% K<sub>2</sub>O), potassium magnesium sulfate (25% K<sub>2</sub>O), and superphosphate (12% P<sub>2</sub>O<sub>5</sub>). The organic N source was a bio-fermented rapeseed cake fertilizer (2.4% TN, 1.05% TP, 2.55% TK). All other agronomic practices followed the 2024 technical guidelines provided by the Hengyang City Company of the Hunan Provincial Tobacco Monopoly Bureau. Detailed fertilization data for each treatment are provided in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Sample collection and classification</title>
<p>To ensure consistency, samples were collected at two distinct stages targeting specific physiological and quality indicators. First, 90 days after transplantation, fresh leaf samples were collected from the sixth leaf position (starting from the top), and 10 leaves were collected from each replicate. After removal of the veins, the leaves were stored at -80&#xb0;C for determination of physiological and biochemical indexes, including enzyme activities (FAS, PEPC, PAP) and metabolite contents (PA, TP). Second, after the flue-curing process, cured leaves of the B2F grade (upper leaves) were selected to measure chemical components (PEE, TS, RS), physical properties (softness, tensile strength, thickness), and the sensory oil content score.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Determination of lipid metabolism-related products</title>
<p>The contents of pyruvic acid (PA), total phenols (TP), and the activities of FAS, PEPC, and PAP were measured using reagent kits from Suzhou Grace Biotechnology Co., Ltd. (Suzhou, China). The mass of all measured samples was 0.1 g, and the volume of solvent was 1 mL.</p>
<p>The content of PA was determined based on its reaction with 2,4-dinitrophenylhydrazine to form 2,4-dinitrophenylhydrazone, a brownish-red hydrazone in an alkaline solution. Absorbance was measured at 520 nm.</p>
<p>The TP content was measured using the Folin-Ciocalteu method, based on phenol-induced reduction of tungstomolybdic acid, producing a blue complex (760 nm).</p>
<p>FAS activity was monitoring NADPH consumption (absorbance at 340 nm) during conversion of acetyl-CoA and malonyl-CoA to long-chain fatty acids.</p>
<p>PEPC activity was assessed through coupled reactions with malate dehydrogenase, tracking NADH oxidation at 340 nm. PAP activity was determined via &#x3b2;-glycerophosphate hydrolysis, detecting liberated inorganic phosphate using a phosphorus-specific reagent.</p>
<p>All assays were conducted in 96-well microtiter plates, with triplicate technical replicates.</p>
<p>The contents of total sugar (TS) and reducing sugar (RS) were determined following YC/T 159-2002, and petroleum ether extract (PEE) was measured according to YC/T 176-2003.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Observation and density statistics of glandular trichomes</title>
<p>During the germination period, the upper surface of the first mature leaf (from top to bottom) was taken, stained with 0.2% (w/v) Rhodamine B for 30 minutes, rinsed three times with distilled water, and blotted dry. Glandular trichome density was quantified using a digital microscope (VHX-500F, KEYENCE Corporation, Japan) by analyzing three random fields from the central upper epidermis.</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Determination of glandular trichome secretions</title>
<p>The first mature leaf (from top to bottom) was taken during the germination period. Leaf discs with a diameter of 5 cm were cut from the leaves. Fifty leaf discs constituted one biological replicate, and three biological replicates were prepared for each material. The leaf discs were extracted by dipping them eight times (2 s each) into a dichloromethane solution. A 1 mL internal standard solution (a mixture of 2.020 mg&#xb7;ml<sup>-</sup>&#xb9; sucrose octaacetate and 2.542 mg&#xb7;ml<sup>-</sup>&#xb9; n-heptadecanol) was added to the extract. After thorough mixing, the solution was filtered and then concentrated using a rotary evaporator (LCA-RN-1300BE, Shanghai Lichen Instrument Technology Co., Ltd.). The concentrate was dried under a nitrogen stream using a nitrogen evaporator (LC-DCY-12GP, Shanghai Lichen Instrument Technology Co., Ltd.). The dried residue was subsequently silylated and analyzed by GC-MS (7890B-5977A, Agilent Technologies Inc., USA).</p>
</sec>
<sec id="s2_7">
<label>2.7</label>
<title>Measurement of physical properties of cured leaves</title>
<p>The leaf softness value (mN) was measured longitudinally and transversely using a softness tester (YT-RRY1000, Hangzhou Yante Technology Co., Ltd.). The tensile strength was determined with a force gauge (SF-10, Wenzhou Weidu Electronics Co., Ltd.), and the thickness was determined using a high-precision thickness gauge (547-401, Mitutoyo Corporation, Japan).</p>
</sec>
<sec id="s2_8">
<label>2.8</label>
<title>Evaluation of oil content in cured tobacco leaves</title>
<p>Oil content was scored based on GB 2635-92 (&#x201c;Grading of Flue-cured Tobacco&#x201d;), supplemented by expert input: abundant (9&#x2013;10 points), present (6&#x2013;8 points), slightly present (3&#x2013;5 points), and sparse (0&#x2013;2 points). Evaluators were blinded to the specific treatments to minimize bias. The scores were treated as a continuous variable for regression modeling, a common practice in sensory analysis to capture subtle quality gradients.</p>
</sec>
<sec id="s2_9">
<label>2.9</label>
<title>RF model construction and design</title>
<p>The model was developed using the RandomForestRegressor class from the scikit-learn library in Python. The standardized key indicators were used as input features, and the original oil content scores served as the target variable. To overcome the limitations of a small sample size (N = 15 biological replicates) and to capture robust non-linear relationships, we implemented a comprehensive modeling framework involving data augmentation, recursive feature elimination (RFE), and hyperparameter optimization.</p>
<sec id="s2_9_1">
<label>2.9.1</label>
<title>Data augmentation strategy</title>
<p>We employed a two-step data augmentation strategy to expand the dataset to N = 45, thereby enhancing model generalizability. First, synthetic samples were generated by injecting Gaussian noise into the original feature vectors, scaled to 3% of the standard deviation of each feature to simulate natural biological variability. Second, linear interpolation was performed between randomly selected pairs of original samples, mimicking intermediate physiological states. A random seed was fixed to ensure reproducibility.</p>
</sec>
<sec id="s2_9_2">
<label>2.9.2</label>
<title>Feature selection via recursive feature elimination</title>
<p>To address potential multicollinearity and identify the most informative predictors, we utilized Recursive Feature Elimination with Cross-Validation (RFECV). This method iteratively removed the least important features based on model accuracy until the optimal feature subset was identified. The selection process was guided by maximizing the R&#xb2; score under 3-fold cross-validation, ensuring that the final model relied only on non-redundant, high-impact indicators.</p>
</sec>
<sec id="s2_9_3">
<label>2.9.3</label>
<title>Model optimization and training</title>
<p>The Random Forest model was trained on the augmented dataset using the selected features. Instead of arbitrary parameter setting, we employed GridSearchCV to systematically optimize key hyperparameters, including the number of estimators (n_estimators), maximum tree depth (max_depth), and minimum samples per leaf (min_samples_leaf). The final model&#x2019;s prediction for a new sample <inline-formula>
<mml:math display="inline" id="im1"><mml:mrow><mml:msup><mml:mi>x</mml:mi><mml:mo>&#x2032;</mml:mo></mml:msup><mml:mo>&#xa0;</mml:mo></mml:mrow></mml:math></inline-formula> is the average of the predictions from all <inline-formula>
<mml:math display="inline" id="im2"><mml:mi>B</mml:mi></mml:math></inline-formula> decision trees in the forest. The equation is shown as <xref ref-type="disp-formula" rid="eq1">Equation&#xa0;1</xref>.</p>
<disp-formula id="eq1"><label>(1)</label>
<mml:math display="block" id="M1"><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>f</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">^</mml:mo></mml:mover><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msup><mml:mi>x</mml:mi><mml:mo>&#x2032;</mml:mo></mml:msup><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>B</mml:mi></mml:mfrac><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>b</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>B</mml:mi></mml:munderover><mml:msub><mml:mi>T</mml:mi><mml:mi>b</mml:mi></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msup><mml:mi>x</mml:mi><mml:mo>&#x2032;</mml:mo></mml:msup><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im3"><mml:mi>B</mml:mi></mml:math></inline-formula> is the total number of decision trees in the forest, and <inline-formula>
<mml:math display="inline" id="im4"><mml:mrow><mml:msub><mml:mi>T</mml:mi><mml:mi>b</mml:mi></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msup><mml:mi>x</mml:mi><mml:mo>&#x2032;</mml:mo></mml:msup><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow></mml:math></inline-formula> represents the prediction of the <inline-formula>
<mml:math display="inline" id="im5"><mml:mi>b</mml:mi></mml:math></inline-formula>-th tree for sample <inline-formula>
<mml:math display="inline" id="im6"><mml:msup><mml:mi>x</mml:mi><mml:mo>&#x2032;</mml:mo></mml:msup></mml:math></inline-formula>.</p>
</sec>
<sec id="s2_9_4">
<label>2.9.4</label>
<title>Model evaluation and interpretation</title>
<p>The overall performance of the model was evaluated using both Out-of-Bag (OOB) estimation and K-fold Cross-Validation (CV, K = 3). The OOB R&#xb2; provides an estimate of the model&#x2019;s generalization performance by using the one-third of the data left out of the bootstrap sample for each tree as a validation set. The cross-validation R&#xb2; is calculated by partitioning the data into K mutually exclusive subsets, iteratively training the model on K-1 subsets and testing on the remaining one, and then averaging the performance. The equation is shown as <xref ref-type="disp-formula" rid="eq2">Equation&#xa0;2</xref>.</p>
<disp-formula id="eq2"><label>(2)</label>
<mml:math display="block" id="M2"><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:msubsup><mml:mi>R</mml:mi><mml:mrow><mml:mi>C</mml:mi><mml:mi>V</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>&#x2208;</mml:mo><mml:mtext>TestData</mml:mtext></mml:mrow></mml:msub><mml:msup><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mover accent="true"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mo>,</mml:mo><mml:mi>C</mml:mi><mml:mi>V</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">^</mml:mo></mml:mover></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:msub><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>&#x2208;</mml:mo><mml:mtext>TestData</mml:mtext></mml:mrow></mml:msub><mml:msup><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mover accent="true"><mml:mi>y</mml:mi><mml:mo>&#xaf;</mml:mo></mml:mover></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im7"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mo>,</mml:mo><mml:mi>C</mml:mi><mml:mi>V</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">^</mml:mo></mml:mover></mml:mrow></mml:math></inline-formula> is the prediction for sample i when it was in the held-out fold, <inline-formula>
<mml:math display="inline" id="im8"><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the true value, and <inline-formula>
<mml:math display="inline" id="im9"><mml:mover accent="true"><mml:mi>y</mml:mi><mml:mo>&#xaf;</mml:mo></mml:mover></mml:math></inline-formula> is the mean of the true values for all samples.</p>
<p>To gain deeper insights into the RF model and uncover underlying mechanisms, we first quantified the global relative importance of each input feature in predicting oil content by calculating the Mean Decrease in Impurity (MDI). Second, we utilized Partial Dependence Plots (PDP) to visualize the marginal effect of changing a single feature on the model&#x2019;s average prediction. The equation is shown as <xref ref-type="disp-formula" rid="eq3">Equation&#xa0;3</xref>.</p>
<disp-formula id="eq3"><label>(3)</label>
<mml:math display="block" id="M3"><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mo stretchy="true">^</mml:mo></mml:mover><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x2248;</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mi>x</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:msubsup><mml:mi>x</mml:mi><mml:mi>C</mml:mi><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>i</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow></mml:msubsup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im10"><mml:mover accent="true"><mml:mi>f</mml:mi><mml:mo>^</mml:mo></mml:mover></mml:math></inline-formula> is the trained RF model, <inline-formula>
<mml:math display="inline" id="im11"><mml:mi>n</mml:mi></mml:math></inline-formula> is the number of samples, and <inline-formula>
<mml:math display="inline" id="im12"><mml:mrow><mml:msubsup><mml:mi>x</mml:mi><mml:mi>C</mml:mi><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mi>i</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow></mml:msubsup></mml:mrow></mml:math></inline-formula> represents the values except feature <inline-formula>
<mml:math display="inline" id="im13"><mml:mi>j</mml:mi></mml:math></inline-formula> for the <inline-formula>
<mml:math display="inline" id="im14"><mml:mi>i</mml:mi></mml:math></inline-formula>-th sample.</p>
<p>Concurrently, SHapley Additive exPlanations (SHAP) value analysis was introduced. Using the TreeExplainer algorithm from the shap library, we calculated the contribution of each feature to the final prediction for every individual sample. SHAP values satisfy the property of additivity, meaning the difference between an individual prediction and the average prediction is equal to the sum of the SHAP values for all features of that sample. The equation is shown as <xref ref-type="disp-formula" rid="eq4">Equation&#xa0;4</xref>.</p>
<disp-formula id="eq4"><label>(4)</label>
<mml:math display="block" id="M4"><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>f</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">^</mml:mo></mml:mover><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msubsup><mml:mi>x</mml:mi><mml:mi>i</mml:mi><mml:mo>'</mml:mo></mml:msubsup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x2212;</mml:mo><mml:mi>E</mml:mi><mml:mrow><mml:mo stretchy="false">[</mml:mo><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mi>f</mml:mi><mml:mrow><mml:mi>r</mml:mi><mml:mi>f</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="true">^</mml:mo></mml:mover><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msup><mml:mi>X</mml:mi><mml:mo>&#x2032;</mml:mo></mml:msup><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">]</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>D</mml:mi></mml:munderover><mml:msub><mml:mi>&#x3d5;</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im15"><mml:mrow><mml:msub><mml:mi>&#x3d5;</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the contribution of feature <inline-formula>
<mml:math display="inline" id="im16"><mml:mi>j</mml:mi></mml:math></inline-formula> to the prediction for sample <inline-formula>
<mml:math display="inline" id="im17"><mml:mi>i</mml:mi></mml:math></inline-formula>, and <inline-formula>
<mml:math display="inline" id="im18"><mml:mi>D</mml:mi></mml:math></inline-formula> is the feature dimension.</p>
<p>These values were visualized through SHAP summary and dependence plots to provide a more comprehensive local and global model interpretation. Model diagnostics were performed by analyzing the distribution of cross-validation residuals (Shapiro-Wilk test for normality), the relationship between residuals and predicted values, and Q-Q plots.</p>
</sec>
</sec>
<sec id="s2_10">
<label>2.10</label>
<title>Data processing and statistical analysis</title>
<p>Data were processed using Excel 2021, SPSS 19.0, and Pycharm 2024. Line graphs and bar charts were produced with OriginPro 2024. One-way analysis of variance (ANOVA) followed by Duncan&#x2019;s new multiple range test was used for variance analysis. The Spearman method was used to calculate correlation coefficients.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Glandular trichome density and secretion content</title>
<p>During the budding stage, the morphology and density of glandular trichomes on the upper leaves were observed and quantified for each treatment. <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref> shows the density of segmented long-stalked glandular hairs gradually increases from ON0 to ON30, but significantly decreases at ON40. The results showed that glandular trichome density followed the order of ON30 &gt; ON20 &gt; ON10 &gt; ON40 &gt; ON0. Specifically, ON30 exhibited a 50.98% increase in total trichome density compared to ON0 (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2A</bold></xref>). The density pattern of long-stalked glandular trichomes, key sites for secretion, mirrored that of total trichomes, with ON30 showing a 53.24% increase compared to ON0. Short-stalked trichome density was highest in ON20; while differences among organic nitrogen treatments were not significant, all exceeded ON0 significantly. Non-secretory epidermal trichomes showed no treatment differences.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Morphology of glandular trichomes on flue-cured tobacco leaves under different organic nitrogen treatments. Representative Ultra-Depth Three-Dimensional microscope images showing the cross-sections of fresh tobacco leaf epidermes at the budding stage. The panels display the effects of treatments with varying organic nitrogen to total nitrogen ratios: ON0 (0%), ON10 (10%), ON20 (20%), ON30 (30%), and ON40 (40%). The images show various trichome types, including prominent long-stalked glandular trichomes (characterized by multi-cellular stalks and secretory heads) and shorter-stalked glandular trichomes. An increase in trichome density, particularly of the long-stalked type, is observable in the ON30 treatment compared to the ON0 control. Scale bars = 200 &#x3bc;m.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767538-g001.tif">
<alt-text content-type="machine-generated">Microscope images show plant surfaces labeled ON0, ON10, ON20, ON30, and ON40, each displaying varying densities and arrangements of hair-like trichomes. A 200 micrometer scale bar appears in each panel for reference.</alt-text>
</graphic></fig>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Density of glandular trichomes and content of secretions in tobacco under different treatments. <bold>(A)</bold> Density of total, long-stalked, short-stalked, and non-glandular trichomes. <bold>(B)</bold> Content of cembratriene-diol (CBT-diol) and sucrose fatty acid esters on the leaf surface. The treatments correspond to varying organic nitrogen to total nitrogen ratios: ON0 (0%), ON10 (10%), ON20 (20%), ON30 (30%), and ON40 (40%). Data are presented as the mean &#xb1; standard error (SE) of three biological replicates. Different lowercase letters above the bars indicate significant differences among treatments at the p&lt; 0.05 level, as determined by one-way ANOVA followed by Duncan&#x2019;s multiple range test. CBT-diol: Cembratriene-diol.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767538-g002.tif">
<alt-text content-type="machine-generated">Grouped bar charts compare trichome density and specific metabolite content across five ON treatments, with panel A showing highest trichome and long-glandular trichome density for ON30, and panel B showing highest CBT-diol for ON30 and highest sucrose fatty acid esters for ON30 and ON20. Error bars and significance letters indicate statistical differences between treatments.</alt-text>
</graphic></fig>
<p>GC&#x2013;MS analysis of trichome secretions revealed that the contents of all measured compounds in ON20, ON30, and ON40 were significantly higher than in ON0 (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2B</bold></xref>). The largest increase occurred in ON30, where cembratriene-diol (CBT-diol) content rose by 68.13% and sucrose esters by 47.39% compared to ON0, paralleling the elevated density of the long-stalked trichomes.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Activities of lipid metabolism-related enzymes</title>
<p>Organic nitrogen ratio significantly influenced lipid-related enzyme activities (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>). FAS activity peaked in ON30, showing a 27.8% increase over ON0 and exceeded ON10 and ON20 significantly. Although slightly lower in ON40, FAS activity remained significantly above ON0. PAP activity significantly increased only in ON30 (by 44.2% compared to NO0), with other treatments showing non-significant increases. Similarly, PEPC activity also peaked in ON30, rising 82.3% over ON0, and was significantly higher than in all other treatments. Taken together, ON30 (a moderately high level of organic nitrogen) maximized FAS, PAP, and PEPC activities.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Activities of lipid metabolism-related enzymes in flue-cured tobacco under different organic nitrogen ratios.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Treatment</th>
<th valign="middle" align="center">FAS<break/>(nmol&#xb7;min<sup>-1&#xb7;</sup>g<sup>-1</sup>)</th>
<th valign="middle" align="center">PAP<break/>(&#x3bc;mol&#xb7;h<sup>-1&#xb7;</sup>g<sup>-1</sup>)</th>
<th valign="middle" align="center">PEPC<break/>(nmol&#xb7;min<sup>-1</sup>&#xb7;g<sup>-1</sup>)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">ON0</td>
<td valign="middle" align="center">68.24 &#xb1; 5.72c</td>
<td valign="middle" align="center">12.31 &#xb1; 0.48b</td>
<td valign="middle" align="center">267.24 &#xb1; 7.15c</td>
</tr>
<tr>
<td valign="middle" align="center">ON10</td>
<td valign="middle" align="center">66.81 &#xb1; 0.71c</td>
<td valign="middle" align="center">13.16 &#xb1; 0.90b</td>
<td valign="middle" align="center">257.95 &#xb1; 1.89c</td>
</tr>
<tr>
<td valign="middle" align="center">ON20</td>
<td valign="middle" align="center">72.88 &#xb1; 3.76bc</td>
<td valign="middle" align="center">13.40 &#xb1; 0.72b</td>
<td valign="middle" align="center">345.12 &#xb1; 16.09b</td>
</tr>
<tr>
<td valign="middle" align="center">ON30</td>
<td valign="middle" align="center">87.17 &#xb1; 4.21a</td>
<td valign="middle" align="center">17.75 &#xb1; 0.35a</td>
<td valign="middle" align="center">487.32 &#xb1; 1.43a</td>
</tr>
<tr>
<td valign="middle" align="center">ON40</td>
<td valign="middle" align="center">81.82 &#xb1; 3.73ab</td>
<td valign="middle" align="center">13.80 &#xb1; 0.55b</td>
<td valign="middle" align="center">336.55 &#xb1; 12.19b</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Different lowercase letters following the data in the same column indicate significant differences among treatments at the 0.05 level. The same notation applies to subsequent tables. FAS: Fatty acid synthase, PAP: Phosphatidic acid phosphatase, PEPC: Phosphoenolpyruvate carboxylase.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Content of key lipid metabolism-related products</title>
<p>The contents of PEE, PA, TP, TS, and RS were analyzed in cured leaves (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>). PEE content was highest in ON30, showing an 18.44% increase compared to Ono, while other treatments did not differ significantly from ON0. PA content decreased significantly in ON30 and ON40 (-17.63% and -5.93%, respectively), whereas ON10 showed a slight increase over ON0. TP content decreased significantly across all treatments compared to ON0, likely reflecting enhanced pyruvate metabolism and downstream diterpenoid biosynthesis, suppressing the phenylpropanoid pathway. Both TS and RS increased with organic nitrogen up to ON30, where they peaked (+43.19% and +64.31% vs. ON0, respectively), before declining in ON40.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Content of key lipid metabolism-related products in cured tobacco leaves under different organic nitrogen ratios.Units: mg&#xb7;g<sup>-1</sup>.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Treatment</th>
<th valign="middle" align="center">PEE</th>
<th valign="middle" align="center">PA</th>
<th valign="middle" align="center">TP</th>
<th valign="middle" align="center">TS</th>
<th valign="middle" align="center">RS</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">ON0</td>
<td valign="middle" align="center">107.37 &#xb1; 0.56b</td>
<td valign="middle" align="center">6.24 &#xb1; 0.05a</td>
<td valign="middle" align="center">98.54 &#xb1; 0.65a</td>
<td valign="middle" align="center">210.66 &#xb1; 1.18e</td>
<td valign="middle" align="center">163.86 &#xb1; 0.67e</td>
</tr>
<tr>
<td valign="middle" align="center">ON10</td>
<td valign="middle" align="center">114.79 &#xb1; 1.45b</td>
<td valign="middle" align="center">6.30 &#xb1; 0.01a</td>
<td valign="middle" align="center">82.09 &#xb1; 0.37c</td>
<td valign="middle" align="center">259.75 &#xb1; 2.36d</td>
<td valign="middle" align="center">222.8 &#xb1; 1.41d</td>
</tr>
<tr>
<td valign="middle" align="center">ON20</td>
<td valign="middle" align="center">114.37 &#xb1; 4.03b</td>
<td valign="middle" align="center">6.17 &#xb1; 0.09a</td>
<td valign="middle" align="center">84.19 &#xb1; 2.33bc</td>
<td valign="middle" align="center">269.66 &#xb1; 1.39c</td>
<td valign="middle" align="center">240.37 &#xb1; 0.53c</td>
</tr>
<tr>
<td valign="middle" align="center">ON30</td>
<td valign="middle" align="center">127.18 &#xb1; 1.13a</td>
<td valign="middle" align="center">5.14 &#xb1; 0.03c</td>
<td valign="middle" align="center">86.77 &#xb1; 0.21b</td>
<td valign="middle" align="center">301.71 &#xb1; 0.8a</td>
<td valign="middle" align="center">269.25 &#xb1; 0.93a</td>
</tr>
<tr>
<td valign="middle" align="center">ON40</td>
<td valign="middle" align="center">112.74 &#xb1; 2.16b</td>
<td valign="middle" align="center">5.87 &#xb1; 0.04b</td>
<td valign="middle" align="center">84.22 &#xb1; 0.56bc</td>
<td valign="middle" align="center">288.24 &#xb1; 1.85b</td>
<td valign="middle" align="center">252.49 &#xb1; 0.2b</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>PEE, Petroleum ether extract, PA, Pyruvic acid, TP: Total phenols, TS, Total sugar, RS, Reducing sugar.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Physical properties of cured leaves</title>
<p>Leaf softness, tensile strength, and thickness responded non-linearly to organic nitrogen (<xref ref-type="table" rid="T3"><bold>Table&#xa0;3</bold></xref>). Softness value (inversely related to softness) decreased then increased with rising organic nitrogen, reaching its lowest (softest) point in ON30, significantly below all other treatments. Tensile strength and leaf thickness followed a rising&#x2013;falling trend, both peaking in ON30. All treatments except ON0 produced leaves within the optimal thickness range (120&#x2013;140 &#x3bc;m) for upper leaves, with ON30 yielding the thickest leaves.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Physical properties of cured tobacco leaves under different organic nitrogen ratios.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Treatment</th>
<th valign="middle" align="center">Softness (mN)</th>
<th valign="middle" align="center">Tensile strength (N)</th>
<th valign="middle" align="center">Thickness (&#x3bc;m)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">ON0</td>
<td valign="middle" align="center">49.74 &#xb1; 0.82a</td>
<td valign="middle" align="center">3.47 &#xb1; 0.29c</td>
<td valign="middle" align="center">116.78 &#xb1; 2.29d</td>
</tr>
<tr>
<td valign="middle" align="center">ON10</td>
<td valign="middle" align="center">41.52 &#xb1; 2.31b</td>
<td valign="middle" align="center">3.94 &#xb1; 0.15b</td>
<td valign="middle" align="center">125.23 &#xb1; 1.93bc</td>
</tr>
<tr>
<td valign="middle" align="center">ON20</td>
<td valign="middle" align="center">36.67 &#xb1; 0.75c</td>
<td valign="middle" align="center">4.00 &#xb1; 0.03b</td>
<td valign="middle" align="center">128.05 &#xb1; 0.75b</td>
</tr>
<tr>
<td valign="middle" align="center">ON30</td>
<td valign="middle" align="center">30.99 &#xb1; 0.97d</td>
<td valign="middle" align="center">4.66 &#xb1; 0.07a</td>
<td valign="middle" align="center">136.28 &#xb1; 1.52a</td>
</tr>
<tr>
<td valign="middle" align="center">ON40</td>
<td valign="middle" align="center">34.62 &#xb1; 0.83cd</td>
<td valign="middle" align="center">4.23 &#xb1; 0.02ab</td>
<td valign="middle" align="center">121.98 &#xb1; 1.52cd</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Oil content score</title>
<p>Oil content scores of cured upper leaves displayed a non-linear response to organic nitrogen (<xref ref-type="fig" rid="f3"><bold>Figure 3</bold></xref>). ON30 and ON40 achieved the highest scores, both significantly exceeding ON0.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Oil content scores of cured tobacco leaves under different organic nitrogen ratios (original data). The plot displays the oil content scores for each of the five treatments, which correspond to organic nitrogen to total nitrogen ratios of ON0 (0%), ON10 (10%), ON20 (20%), ON30 (30%), and ON40 (40%). Each small point represents an individual replicate score (n=3), while the large colored circle represents the mean score for that treatment. Error bars indicate the standard deviation (SD). An asterisk (*) denotes a statistically significant difference between the indicated groups (p&lt; 0.05), as determined by one-way ANOVA followed by Duncan&#x2019;s multiple range test.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767538-g003.tif">
<alt-text content-type="machine-generated">Scatter plot with error bars compares oil content for ON0, ON10, ON20, ON30, and ON40 groups. Oil content increases from ON0 to ON40, with significant differences indicated by asterisks and p &#x2264; 0.05.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_6">
<label>3.6</label>
<title>Correlation analysis</title>
<p>Spearman correlation analysis (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>) was conducted to explore the relationships among oil content and physicochemical indicators. As shown in the heatmap, oil content exhibited significant positive correlations (p&lt; 0.05) with PEE, FAS, TS, RS, Glandular trichomes density (GT), CBT-diol, PEPC, PAP, and tensile strength (TsS). Conversely, it showed significant negative correlations with PA content and softness value (Sof). Notably, strong multicollinearity was observed between certain features, such as TS and RS, necessitating feature selection for subsequent modeling.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Spearman correlation analysis of physicochemical indicators and oil content. The heatmap displays the pairwise Spearman&#x2019;s rank correlation coefficients. The color gradient represents the correlation coefficient value, with red indicating a positive correlation and blue indicating a negative correlation. Asterisks denote statistical significance (*p&lt; 0.05, **p&lt; 0.01, ***p&lt; 0.001). PA: Pyruvic acid, TP: Total phenols, PEE: Petroleum ether extract, TS: Total sugar, RS: Reducing sugar, GT: Glandular trichomes density, CBT-diol: Cembratriene-diol, SE: Sucrose esters, FAS: Fatty acid synthase, PEPC: Phosphoenolpyruvate carboxylase, PAP: Phosphatidic acid phosphatase, Sof: Softness, TsS: Tensile strength, Thk: Thickness.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767538-g004.tif">
<alt-text content-type="machine-generated">Triangular correlation matrix heatmap showing correlations among fourteen variables, with blue representing negative correlations and red representing positive correlations. Statistical significance is indicated by asterisks within the colored squares. A vertical color scale bar from negative one to positive one is displayed to the right.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_7">
<label>3.7</label>
<title>Random forest model performance and diagnostics</title>
<p>To construct a robust predictive model despite the limited sample size, we employed a data augmentation strategy combined with rigorous feature selection, and encoded the treatments as 0, 10, 20, 30, 40.</p>
<p>Recursive Feature Elimination (RFE) with cross-validation was first applied to the augmented dataset. As shown in <xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5A, the</bold></xref> model&#x2019;s performance stabilized when the number of features was reduced to five. Consequently, PEE, CBT-diol, Sof, RS, and GT were selected as the optimal input features for the final model, effectively reducing redundancy while retaining critical biological information.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Performance and diagnostic plots for the random forest model. All analyses were performed on the augmented dataset. <bold>(A)</bold> RFE Feature Selection Performance, illustrating the cross-validation score (R&#xb2;) as a function of the number of selected features. <bold>(B)</bold> Out-of-Bag (OOB) error curve, showing the smoothed model error rate as the number of estimators (trees) increases. <bold>(C)</bold> Cross-validation predicted versus actual oil content values using the original dataset (N = 15), illustrating the model&#x2019;s inability to generalize due to limited sample size (CV R<sup>2</sup>=&#x2212;0.039). <bold>(D)</bold> Cross-validation predicted versus actual values using the augmented dataset (N = 45), demonstrating significantly improved predictive accuracy and the effectiveness of the augmentation strategy (CV R<sup>2</sup> = 0.819). <bold>(E)</bold> Grid Search Performance (CV R&#xb2;), displaying the impact of max_depth and min_samples_leaf on model accuracy. <bold>(F)</bold> Residuals Distribution, showing the frequency of residual values with a fitted normal distribution curve. <bold>(G)</bold> Quantile-Quantile (Q-Q) plot of the CV residuals against a theoretical normal distribution. <bold>(H)</bold> Sensitivity of Model Performance to Data Augmentation Noise, demonstrating the stability of OOB R&#xb2; across different noise levels.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767538-g005.tif">
<alt-text content-type="machine-generated">Panel A: Line graph showing cross-validation R squared score versus number of features, with scores slightly decreasing as features increase from five to eleven. Panel B: Line graph of out-of-bag error versus number of estimators, demonstrating rapid error reduction followed by plateauing. Panel C: Scatter plot of predicted versus actual oil content with a CV R squared of negative zero point zero three nine, showing little correlation. Panel D: Scatter plot of predicted versus actual oil content with a CV R squared of zero point eight one nine, showing strong positive correlation. Panel E: Heatmap displaying CV R squared scores for varying combinations of max depth and minimum samples per leaf, with values ranging from zero point seven nine two to zero point eight two zero. Panel F: Histogram of residuals with an overlaid density curve, indicating most residuals are near zero. Panel G: Quantile-quantile plot comparing ordered values to theoretical quantiles, with most points near the reference line except a few outliers. Panel H: Line graph of out-of-bag R squared score declining as noise level increases from one percent to ten percent.</alt-text>
</graphic></fig>
<p>The Random Forest model trained on this optimized feature set and augmented data demonstrated excellent performance. Grid search optimization (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5E</bold></xref>) identified the optimal hyperparameters (e.g., n_estimators=300, max_depth=10, min_samples_leaf=1), which were used for the final training. The model achieved an OOB R&#xb2; of 0.781 and a 3-fold CV R&#xb2; of 0.819. In stark contrast, the model trained on the original small dataset (N = 15) failed to generalize, yielding a negative CV R&#xb2; (-0.039) (<xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5C, D</bold></xref>). This comparison underscores the necessity and effectiveness of our data augmentation strategy. The OOB error curve (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5B</bold></xref>) further confirmed that the error rate stabilized and minimized around 150&#x2013;200 trees, validating the sufficiency of setting n_estimators to 300.</p>
<p>Model diagnostics indicated that the assumptions for regression were met. The distribution of residuals was approximately normal (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5F</bold></xref>), and the Q-Q plot (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5G</bold></xref>) showed that the standardized residuals aligned well with the theoretical quantiles, with no significant deviations. Sensitivity analysis (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5H</bold></xref>) demonstrated that the model&#x2019;s performance remained relatively stable across different noise levels (1% - 3%) used in augmentation, although performance degraded at very high noise levels (10%), confirming the appropriateness of the chosen 3% noise parameter.</p>
</sec>
<sec id="s3_8">
<label>3.8</label>
<title>Identification of key physicochemical indicators</title>
<p>Feature importance analysis based on Mean Decrease in Impurity (MDI) (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>) revealed the relative contribution of each indicator to the oil content prediction. PEE was identified as the most influential predictor, followed closely by CBT-diol and Sof. The feature importance rankings between the trained models based on the raw data and enhanced data are almost consistent, further verifying the robustness of identifying key features.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Feature importance comparison. This bar chart compares the importance of features derived from the Random Forest model trained on the original dataset versus the augmented dataset. The importance is measured by the Mean Decrease in Impurity (MDI). PA: Pyruvic acid, PEE: Petroleum ether extract, GT: Glandular trichomes density, CBT-diol: Cembratriene-diol, Sof: Softness.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767538-g006.tif">
<alt-text content-type="machine-generated">Bar chart comparing feature importance for five features (PA, PEE, GT, CBT-diol, Sof) between original and augmented datasets, showing PEE as most important in both, with original consistently higher except for PA and Sof.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_9">
<label>3.9</label>
<title>Mechanistic interpretation of key indicators&#x2019; effects on tobacco oil content</title>
<p>To gain a deeper understanding of how key indicators influence oil content, we interpreted the RF model using Partial Dependence Plots (PDP) and SHAP value analysis.</p>
<p>The PDP (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref>) revealed the marginal effects of the top five features. PEE and CBT-diol demonstrated strong positive associations with oil content: as their values increased, the predicted oil content score rose sharply before leveling off, suggesting a saturation effect. GT also showed a positive trend. In contrast, Sof exhibited a clear negative relationship, where lower softness values (indicating softer leaves) were associated with higher oil scores. PA showed a threshold effect, where oil scores dropped significantly when PA content exceeded a certain level.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Partial dependence plots (PDP) of key indicators on predicted oil content with inflection points. The panels display the marginal effects of the top five features on the predicted oil content score, as determined by the Random Forest model trained on the augmented dataset. The y-axis represents the average partial dependence, and the x-axis corresponds to the value of each feature on its original scale. Red dots indicate the primary inflection points (points of maximum gradient change), with their specific values annotated, highlighting critical thresholds where feature influence shifts most dramatically. Rug plots at the bottom show the distribution of the augmented data points. PEE: Petroleum ether extract, CBT-diol: Cembratriene-diol, PA: Pyruvic acid, Sof: Softness, GT: Glandular trichomes density.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767538-g007.tif">
<alt-text content-type="machine-generated">Grouped partial dependence plots for five variables&#x2014;PEE, CBT-diol, PA, Sof, and GT&#x2014;each with a blue line illustrating effect trends, marked with a red dot, arrow, and associated threshold value in red text.</alt-text>
</graphic></fig>
<p>SHAP analysis provided further insights into individual feature contributions and interactions. The SHAP summary plot (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8A</bold></xref>) confirmed the global importance trends, showing that high values of PEE, CBT-diol, and GT had a positive impact on the model output (pushing it to the right), while high values of Sof and PA had a negative impact. We further explored the interactions among the top four features using SHAP dependence plots (<xref ref-type="fig" rid="f8"><bold>Figures&#xa0;8B&#x2013;E</bold></xref>), which revealed that the influence of individual indicators is highly context-dependent. For instance, the positive contribution of PEE to oil content was notably modulated by CBT-diol, specifically, samples characterized by both high PEE and high CBT-diol levels exhibited elevated SHAP values, suggesting a synergistic effect between these lipid-related metabolites. A similar but negative, more complex, interaction was observed between CBT-diol and leaf softness. Differently, the negative effects of Sof and PA on oil content were found to vary depending on the levels of PEE and Sof, respectively. These results underscore that tobacco oil content is not determined by single factors in isolation, but rather by the complex interplay among lipid metabolites, physical properties, and precursor availability.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>SHAP value analysis of the random forest model. <bold>(A)</bold> SHAP Summary Plot. Each point represents a single sample. The position on the y-axis indicates the feature, and the position on the x-axis indicates the SHAP value (impact on model output). The color represents the feature value (red for high, blue for low). <bold>(B-E)</bold> SHAP Dependence Plots Illustrating Interaction Effects. Each panel plots the SHAP value of a primary feature against its own value. The color of the points is determined by the value of a second, interacting feature. <bold>(B)</bold> SHAP dependence for PEE colored by CBT-diol. <bold>(C)</bold> SHAP dependence for CBT-diol colored by Sof. <bold>(D)</bold> SHAP dependence for PA colored by PEE. <bold>(E)</bold> SHAP dependence for Sof colored by PEE. PEE: Petroleum ether extract, CBT-diol: Cembratriene-diol, PA: Pyruvic acid, Sof: Softness, GT: Glandular trichomes density.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767538-g008.tif">
<alt-text content-type="machine-generated">Panel A displays a SHAP summary dot plot showing feature importance for five variables (PEE, CBT-diol, PA, Sof, GT) with SHAP values on the x-axis and feature value from low (blue) to high (pink). Panels B through E show individual SHAP dependence scatter plots for PEE, CBT-diol, PA, and Sof, respectively, each illustrating how varying feature values influence their SHAP values and model output, with color indicating another feature's values.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_10">
<label>3.10</label>
<title>Data structure and model</title>
<p>t-SNE visualization (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref>) was employed to explore the underlying data structure. <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9A</bold></xref> shows that samples from different organic nitrogen treatments (ON0-ON40) formed distinct clusters or gradients in the 2D space, confirming that the selected five features contain sufficient information to distinguish between treatments. <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9B</bold></xref> displays the features in the t-SNE space, colored by their importance. The proximity of certain features (e.g., GT and CBT-diol) suggests they may share similar information or biological roles in determining leaf quality.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>t-SNE dimensionality reduction visualization of augmented data. <bold>(A)</bold> t-SNE plot of the augmented samples (N = 45), colored by their respective organic nitrogen treatment level (% Org. N). This visualization confirms that the data augmentation strategy preserved the distinct clustering patterns of different treatments in the high-dimensional feature space. <bold>(B)</bold> t-SNE plot of the physicochemical features, colored by their feature importance score from the Random Forest model. Proximity between features may suggest similar functional roles or response patterns. PA, Pyruvic acid; PEE, Petroleum ether extract; GT, Glandular trichomes density; CBT-diol, Cembratriene-diol; Sof, Softness.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767538-g009.tif">
<alt-text content-type="machine-generated">Panel A is a scatter plot displaying sample t-SNE dimensions, with points colored by five different treatment groups. Panel B is a scatter plot of feature t-SNE dimensions, with feature importance indicated by point color and size, and corresponding feature names labeled.</alt-text>
</graphic></fig>
<p>Finally, we compared the treatment levels with the RF model&#x2019;s cross-validation predictions (<xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref>). The average predicted oil content for each treatment level accurately reproduced the non-linear trend observed in the actual field experiment: rising from ON0 to a peak at ON30, and then slightly declining at ON40. This confirms that our machine learning model successfully captured the true biological response of tobacco oil content to varying organic nitrogen application ratios.</p>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>Relationship between treatment level and cross-validated predictions of oil content (augmented data). The plot displays the cross-validation (CV) predicted oil content scores from the Random Forest model for each sample in the augmented dataset (N = 45) under different organic nitrogen ratios. Each point represents a single augmented sample, with its color indicating the predicted oil content value. The dashed red line connects the average predicted oil content for each treatment level, illustrating the overall trend captured by the model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767538-g010.tif">
<alt-text content-type="machine-generated">Scatterplot with grouped color-coded points showing predicted oil content versus organic nitrogen ratio percentage, overlaid with a red dashed line for average prediction and a legend labeled Average Prediction in the upper right corner.</alt-text>
</graphic></fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<sec id="s4_1">
<label>4.1</label>
<title>Glandular trichomes and secretions as primary drivers of oil content</title>
<p>The secretory trichomes (glandular trichomes) on the leaf surface of flue-cured tobacco at specific developmental stages are a key factor influencing oil content and overall quality. Glandular trichomes are the sites for the synthesis and secretion of numerous very-long-chain fatty acids, their derivatives, and alicyclic compounds (<xref ref-type="bibr" rid="B26">Philippe et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B36">Wang, 2014</xref>). Among these, cembratriene-diol and sucrose esters are important secretions of the glandular trichomes. Both are crucial aroma precursors that can impart desirable aroma and sweetness to flue-cured tobacco (<xref ref-type="bibr" rid="B29">Qu et&#xa0;al., 2018</xref>), and they enhance the &#x201c;oily&#x201d; sensation of the leaf surface, contributing to the improvement of the tobacco&#x2019;s appearance quality. As the primary secretory organs for terpenoids, an increased density of long-stalked glandular trichomes directly thickens the waxy layer on the leaf surface, thereby enhancing the tactile perception of oiliness (e.g., smoothness) and the aroma (<xref ref-type="bibr" rid="B38">Wang et&#xa0;al., 2022</xref>). In this study, all treatments with increased organic nitrogen ratios showed significantly greater densities of all types of glandular trichomes and higher secretion contents compared to the control. Notably, in ON30, the density of long-stalked glandular trichomes increased by 53.24% compared to ON0, with a concurrent significant rise in the contents of CBT-diol and sucrose ester secretions. This is likely the reason why the final oil content score for ON30 was significantly higher than that for ON0. Our Random Forest model further validated this biological observation: Recursive Feature Elimination (RFE) identified both Glandular Trichome density (GT) and CBT-diol content as top-tier predictors (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5A</bold></xref>), confirming their indispensable role in determining the final oil score. Some researchers suggest that the content of glandular trichome secretions may be related to the regulation of cell wall structure by the combined application of organic nitrogen (<xref ref-type="bibr" rid="B44">Zhou et&#xa0;al., 2024</xref>). For instance, the increased leaf thickness observed in ON30 might enhance the mechanical strength of the leaf, reducing physical damage to the trichomes during growth and thus allowing for the retention of more secretions. However, this mechanism requires further verification.</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Lipid metabolism as a core biochemical pathway</title>
<p>Carbohydrate-derived pyruvic acid (PA) serves as a centralxnode linking glycolysis to lipid biosynthesis, acting as a precursor for acetyl-CoA, fatty acid chains, sterols, and terpenes via the tricarboxylic acid (TCA) cycle and methylerythritol phosphate (MEP) pathway (<xref ref-type="bibr" rid="B22">Li-Beisson et&#xa0;al., 2010</xref>). The synthesis of TP, secondary metabolites derived from PA metabolism, competes with lipid synthesis for common precursors like phosphoenolpyruvate (PEP). In ON30, PA levels declined sharply (&#x2212;17.6%), suggesting enhanced carbon flux toward acetyl-CoA and downstream lipid synthesis (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>). This reduction is consistent with the hypothesis that carbon flux may be reallocated from the PA pool towards acetyl-CoA via the TCA cycle for lipid synthesis or towards other downstream products (<xref ref-type="bibr" rid="B11">Chen and Zhu, 2023</xref>), although this metabolic flux shift is inferred from static concentration changes. The enhancement of this metabolic pathway might indirectly lead to the downregulation of the phenylpropanoid pathway, thus explaining the decrease in TP content. PEPC is a key enzyme in carbon fixation and the supply of precursors for amino acid and organic acid synthesis, influencing overall metabolic flux and ultimately affecting the production of secondary metabolites (<xref ref-type="bibr" rid="B1">Baena et&#xa0;al., 2021</xref>). An increase in its activity not only accelerates the conversion of PA but also promotes the accumulation of TS and RS by enhancing carbon-nitrogen synergy. FAS plays a central role in the <italic>de novo</italic> synthesis of fatty acids, and its increased activity directly promotes fatty acid accumulation (<xref ref-type="bibr" rid="B20">Kitajima-Koga et&#xa0;al., 2020</xref>). Meanwhile, PAP is involved in lipid metabolism and the regulation of phospholipid levels, and the reactions it participates in are crucial steps in the synthesis and storage of triacylglycerols (<xref ref-type="bibr" rid="B35">Torres-Rodr&#xed;guez et&#xa0;al., 2021</xref>). This study found that ON30 significantly enhanced the activities of FAS, PAP, and PEPC, which is likely a key factor contributing to the significant increase in the oil content score for this treatment. The significant increase in PEE content in ON30 and its strong correlation with oil content further corroborate this conclusion, as PEE comprises nearly all secondary metabolites in tobacco leaves (<xref ref-type="bibr" rid="B19">Jiang et&#xa0;al., 2025</xref>) and is often used as a proxy indicator for the &#x201c;oil content&#x201d; of flue-cured tobacco. However, a notable decline in enzyme activities (FAS, PEPC) and lipid metabolites (PEE, CBT-diol) was observed at the highest organic nitrogen level (ON40). This &#x201c;diminishing return&#x201d; or inhibitory effect likely stems from the carbon-nitrogen imbalance hypothesis. Excessive organic nitrogen input in ON40 may lead to an overabundance of nitrogen relative to carbon skeletons. According to the C/N balance theory, plants prioritize carbon resources for amino acid and protein synthesis to assimilate excess nitrogen, thereby diverting acetyl-CoA away from the lipid biosynthesis pathway (<xref ref-type="bibr" rid="B15">Fritz et&#xa0;al., 2006</xref>). Additionally, the significantly lower soil pH observed under high organic loading (ON40) might create a sub-optimal rhizosphere environment, suppressing the activity of soil microorganisms and root enzymes essential for nutrient uptake and metabolism (<xref ref-type="bibr" rid="B14">Feng et&#xa0;al., 2023</xref>). Meanwhile, it is crucial to acknowledge a potential spatial mismatch: while our enzyme activity assays represent whole-leaf protein levels, lipid biosynthesis relevant to &#x201c;oiliness&#x201d; is highly concentrated in the glandular trichomes. Future studies utilizing trichome-specific metabolite profiling are needed to directly link enzyme expression with localized lipid accumulation.</p>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>Synergistic effects of leaf physical properties</title>
<p>The sensory evaluation of oil content depends not only on chemical composition but is also closely related to the physical properties of the tobacco leaf (<xref ref-type="bibr" rid="B6">Cai et&#xa0;al., 2023</xref>). In our study, ON30 significantly reduced the softness value (<xref ref-type="table" rid="T3"><bold>Table&#xa0;3</bold></xref>), indicating that the leaves from this treatment were softer, which is consistent with the typical tactile characteristics of high-oil-content leaves (<xref ref-type="bibr" rid="B21">Li et&#xa0;al., 2008</xref>). The increase in tensile strength reflects an optimization of the leaf&#x2019;s fibrous structure, which may be attributed to the regulation of cell wall components (such as cellulose and pectin) by the combined application of organic nitrogen (<xref ref-type="bibr" rid="B24">Ogden et&#xa0;al., 2018</xref>). Furthermore, the significant increase in leaf thickness for ON30, while remaining within the standard range (120-140 &#x3bc;m), ensured both good combustion performance and avoided difficulties in rolling due to excessive thickness. These physical traits contribute directly to the perception of oiliness, highlighting the multifactorial nature of oil content, where chemical and structural factors act synergistically. The deterioration of these physical traits (increased hardness, decreased thickness) in ON40 further supports the notion of a physiological stress response to nutrient over-supply, where rapid vegetative growth might occur at the expense of structural refinement and secondary metabolite accumulation. Importantly, our RF model identified Softness (Sof) as a top-three predictor. While softness itself is a physical state rather than a metabolic driver like FAS, it serves as a critical &#x201c;accompanying trait&#x201d; that integrates the outcomes of cell wall structure and moisture retention, making it a reliable indicator for sensory quality.</p>
</sec>
<sec id="s4_4">
<label>4.4</label>
<title>Insights from random forest model</title>
<p>Despite the inherent challenges of small sample sizes in agricultural field trials, the Random Forest (RF) model, augmented with a rigorous data generation strategy (noise injection and linear interpolation), demonstrated robust explanatory power. The stark contrast between the poor performance on original data (CV R&#xb2; = -0.039) and the high accuracy on augmented data (CV R&#xb2; = 0.819) highlights the necessity of data augmentation in capturing latent biological patterns that are otherwise obscured by limited sampling (<xref ref-type="bibr" rid="B33">Shorten and Khoshgoftaar, 2019</xref>). By integrating RFE for feature selection, we distilled the model down to five core indicators&#x2014;PEE, CBT-diol, Sof, PA, and GT&#x2014;which collectively explain the majority of the variance in oil content.</p>
<p>The feature importance analysis (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>) and PDP (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref>) quantified the relative contributions of these markers. PEE and CBT-diol emerged as the most dominant positive drivers, confirming that the abundance of lipid-related metabolites is the material basis of oiliness. Interestingly, PA exhibited a threshold-dependent negative effect, consistent with its role as a transient metabolic precursor that is depleted during active lipid synthesis (<xref ref-type="bibr" rid="B42">Zeng et&#xa0;al., 2025</xref>).</p>
<p>Crucially, the SHAP interaction analysis (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8</bold></xref>) moved beyond single-factor effects to reveal context-dependent regulation. We observed that the positive contribution of PEE to oil content was synergistic with CBT-diol levels. This reflects the physiological reality where PEE (a solvent mixture) and CBT-diol (a specific solute) co-vary to determine the sensory &#x201c;oiliness.&#x201d; Similarly, the negative impact of Softness appeared to be modulated by PEE levels, suggesting that high lipid content might partially compensate for less-than-ideal leaf texture. These non-linear and interactive insights provide a more nuanced understanding of quality formation than traditional linear correlation analyses.</p>
</sec>
<sec id="s4_5">
<label>4.5</label>
<title>Study limitations and future directions</title>
<p>While this study offers valuable insights into the regulation of tobacco oil content, several limitations must be acknowledged. First, the field experiment was conducted at a single location over one growing season. Given the known influence of environmental factors (temperature, rainfall, soil type) on secondary metabolism, multi-year and multi-location trials are necessary to validate the generalizability of the optimal 30% organic nitrogen ratio. Second, although the data augmentation strategy successfully mitigated overfitting and improved model convergence (as evidenced by the OOB error curve), the original sample size (N = 15 biological replicates) remains small for machine learning applications. The findings should be interpreted as exploratory hypothesis generation rather than definitive predictive rules. Future research should prioritize larger-scale datasets and incorporate multi-omics approaches (transcriptomics and metabolomics) to construct a comprehensive regulatory network spanning genes, metabolites, and sensory traits.</p>
</sec>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>In conclusion, this study demonstrates that optimizing the organic nitrogen ratio, particularly at 30%, enhances flue-cured tobacco oil content via coordinated effects on glandular trichome development, lipid metabolism, and leaf physical properties. By integrating field experiments with a Random Forest model trained on augmented data, we successfully captured the non-linear, interactive pathways underpinning oil content regulation. PEE, CBT-diol, and Softness emerged as the most robust indicators, with PEE and CBT-diol acting as primary material drivers and Softness serving as a key accompanying physical trait. These findings establish a data-driven framework for improving tobacco leaf quality and provide a theoretical basis for precise nitrogen management. Future work should focus on validating these mechanisms across diverse production environments and employing gland-specific metabolic profiling.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material</bold></xref>. Further inquiries can be directed to the corresponding authors.</p></sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>ZS: Conceptualization, Data curation, Formal analysis, Validation, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. WJ: Conceptualization, Software, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. HL: Formal analysis, Writing &#x2013; review &amp; editing. YL: Funding acquisition, Writing &#x2013; review &amp; editing. XY: Investigation, Writing &#x2013; review &amp; editing. CP: Resources, Writing &#x2013; review &amp; editing. LS: Funding acquisition, Writing &#x2013; review &amp; editing. QY: Validation, Writing &#x2013; review &amp; editing. JF: Project administration, Supervision, Writing &#x2013; review &amp; editing. JC: Conceptualization, Methodology, Writing &#x2013; review &amp; editing. SD: Conceptualization, Funding acquisition, Writing &#x2013; review &amp; editing.</p></sec>
<ack>
<title>Acknowledgments</title>
<p>Thanks for the assistance in revising the article by Professor Ling Yuan from Tobacco Research and Development Center at the University of Kentucky.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>YL, XY, CP, LS, QY, JF were employed by company China Tobacco Guangdong Industrial Co., Ltd.</p>
<p>The remaining author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2026.1767538/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2026.1767538/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="DataSheet1.zip" id="SM1" mimetype="application/zip"/>
<supplementary-material xlink:href="Table1.xlsx" id="SF1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table2.xlsx" id="SF2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Baena</surname> <given-names>G.</given-names></name>
<name><surname>Feria</surname> <given-names>A. B.</given-names></name>
<name><surname>Hern&#xe1;ndez-Huertas</surname> <given-names>L.</given-names></name>
<name><surname>Gandullo</surname> <given-names>J.</given-names></name>
<name><surname>Echevarr&#xed;a</surname> <given-names>C.</given-names></name>
<name><surname>Monreal</surname> <given-names>J. A.</given-names></name>
<etal/>
</person-group>. (<year>2021</year>). 
<article-title>Genetic and pharmacological inhibition of autophagy increases the monoubiquitination of non-photosynthetic phosphoenolpyruvate carboxylase</article-title>. <source>Plants.</source> <volume>10</volume>, <elocation-id>12</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/plants10010012</pub-id>, PMID: <pub-id pub-id-type="pmid">33374865</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>B&#xe9;nard</surname> <given-names>C.</given-names></name>
<name><surname>Veiga</surname> <given-names>S. D.</given-names></name>
<name><surname>Scornet</surname> <given-names>E.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Mean decrease accuracy for random forests: inconsistency, and a practical solution via the Sobol-MDA</article-title>. <source>Biometrika.</source> <volume>109</volume>, <fpage>881</fpage>&#x2013;<lpage>900</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/biomet/asac017</pub-id>, PMID: <pub-id pub-id-type="pmid">36970824</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bender</surname> <given-names>S. F.</given-names></name>
<name><surname>Schulz</surname> <given-names>S.</given-names></name>
<name><surname>Mart&#xed;nez-Cuesta</surname> <given-names>R.</given-names></name>
<name><surname>Laughlin</surname> <given-names>R. J.</given-names></name>
<name><surname>Kublik</surname> <given-names>S.</given-names></name>
<name><surname>Pfeiffer-Zakharova</surname> <given-names>K.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Simplification of soil biota communities impairs nutrient recycling and enhances above- and belowground nitrogen losses</article-title>. <source>New Phytol.</source> <volume>240</volume>, <fpage>2020</fpage>&#x2013;<lpage>2034</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/nph.19252</pub-id>, PMID: <pub-id pub-id-type="pmid">37700504</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bouni</surname> <given-names>M.</given-names></name>
<name><surname>Hssina</surname> <given-names>B.</given-names></name>
<name><surname>Douzi</surname> <given-names>K.</given-names></name>
<name><surname>Douzi</surname> <given-names>S.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Interpreta ble machine learning techniques for an advanced crop recommendation model</article-title>. <source>J. Electr. Comput. Eng.</source> <volume>2024</volume>, <elocation-id>7405217</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2024/7405217</pub-id>, PMID: <pub-id pub-id-type="pmid">41641447</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bureau</surname> <given-names>A.</given-names></name>
<name><surname>Dupuis</surname> <given-names>J.</given-names></name>
<name><surname>Falls</surname> <given-names>K.</given-names></name>
<name><surname>Lunetta</surname> <given-names>K. L.</given-names></name>
<name><surname>Hayward</surname> <given-names>B.</given-names></name>
<name><surname>Keith</surname> <given-names>T. P.</given-names></name>
<etal/>
</person-group>. (<year>2005</year>). 
<article-title>Identifying SNPs predictive of phenotype using random forests</article-title>. <source>Genet. Epidemiol.</source> <volume>28</volume>, <fpage>171</fpage>&#x2013;<lpage>182</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/gepi.20041</pub-id>, PMID: <pub-id pub-id-type="pmid">15593090</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cai</surname> <given-names>C. C.</given-names></name>
<name><surname>Wu</surname> <given-names>C. L.</given-names></name>
<name><surname>Cheng</surname> <given-names>J. Q.</given-names></name>
<name><surname>Li</surname> <given-names>Y. P.</given-names></name>
<name><surname>Yang</surname> <given-names>J.</given-names></name>
<name><surname>Ren</surname> <given-names>X. H.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Research progress and prospect of oil in tobacco leaf</article-title>. <source>Hubei Agric. Sci.</source> <volume>62</volume>, <fpage>1</fpage>&#x2013;<lpage>6</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.14088/j.cnki.issn0439-8114.2023.S1.001</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Carman</surname> <given-names>G. M.</given-names></name>
<name><surname>Han</surname> <given-names>G.</given-names></name>
</person-group> (<year>2006</year>). 
<article-title>Roles of phosphatidate phosphatase enzymes in lipid metabolism</article-title>. <source>Trends Biochem. Sci.</source> <volume>31</volume>, <fpage>694</fpage>&#x2013;<lpage>699</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tibs.2006.10.003</pub-id>, PMID: <pub-id pub-id-type="pmid">17079146</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Carman</surname> <given-names>G. M.</given-names></name>
<name><surname>Han</surname> <given-names>G.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>Phosphatidic acid phosphatase, a key enzyme in the regulation of lipid synthesis</article-title>. <source>J. Biol. Chem.</source> <volume>284</volume>, <fpage>2593</fpage>&#x2013;<lpage>2597</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1074/jbc.R800059200</pub-id>, PMID: <pub-id pub-id-type="pmid">18812320</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chen</surname> <given-names>Y. J.</given-names></name>
<name><surname>Ren</surname> <given-names>K.</given-names></name>
<name><surname>He</surname> <given-names>X.</given-names></name>
<name><surname>Gong</surname> <given-names>J. S. Q.</given-names></name>
<name><surname>Hu</surname> <given-names>X. D.</given-names></name>
<name><surname>Su</surname> <given-names>J. E.</given-names></name>
<etal/>
</person-group>. (<year>2019</year>). 
<article-title>Dynamic changes in physiological and biochemical properties of flue-cured tobacco of different leaf ages during flue-curing and their effects on yield and quality</article-title>. <source>BMC Plant Biol.</source> <volume>19</volume>, <fpage>555</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12870-019-2143-x</pub-id>, PMID: <pub-id pub-id-type="pmid">31842767</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chen</surname> <given-names>Y. C.</given-names></name>
<name><surname>Wang</surname> <given-names>S. B.</given-names></name>
<name><surname>He</surname> <given-names>X. X.</given-names></name>
<name><surname>Gao</surname> <given-names>J. P.</given-names></name>
<name><surname>Zhang</surname> <given-names>X. Y.</given-names></name>
<name><surname>Huang</surname> <given-names>P. J.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Metabolomic and transcriptomic analyses reveal differences in fatty acids in tobacco leaves across cultivars and developmental stages</article-title>. <source>BMC Plant Biol.</source> <volume>25</volume>, <fpage>312</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12870-025-06337-9</pub-id>, PMID: <pub-id pub-id-type="pmid">40069610</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chen</surname> <given-names>C.</given-names></name>
<name><surname>Zhu</surname> <given-names>S. H.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>&#x3b2;-Cyclodextrin-based nitrosoglutathione improves the storage quality of peach by regulating the metabolism of endogenous nitric oxide, hydrogen sulfide, and phenylpropane</article-title>. <source>Phyton-Int. J. Exp. Bot.</source> <volume>92</volume>, <fpage>1091</fpage>&#x2013;<lpage>1107</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.32604/phyton.2023.026331</pub-id>, PMID: <pub-id pub-id-type="pmid">40612875</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Dinesh</surname> <given-names>P.</given-names></name>
<name><surname>Nikita</surname> <given-names>B.</given-names></name>
<name><surname>Saurav</surname> <given-names>D.</given-names></name>
<name><surname>Arash</surname> <given-names>G.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Rooted in nature: the rise, challenges, and potential of organic farming and fertilizers in agroecosystems</article-title>. <source>Sustainability.</source> <volume>16</volume>, <elocation-id>1530</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/su16041530</pub-id>, PMID: <pub-id pub-id-type="pmid">41725453</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fan</surname> <given-names>Z. Q.</given-names></name>
<name><surname>Li</surname> <given-names>J. Y.</given-names></name>
<name><surname>Lu</surname> <given-names>M. Z.</given-names></name>
<name><surname>Li</surname> <given-names>X. L.</given-names></name>
<name><surname>Yin</surname> <given-names>H. F.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Overexpression of phosphoenolpyruvate carboxylase from Jatropha curcas increases fatty acid accumulation in Nicotiana tabacum</article-title>. <source>Acta Physiol. Plant</source> <volume>35</volume>, <fpage>2269</fpage>&#x2013;<lpage>2279</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11738-013-1264-3</pub-id>, PMID: <pub-id pub-id-type="pmid">41737715</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Feng</surname> <given-names>Z. W.</given-names></name>
<name><surname>Liu</surname> <given-names>X. D.</given-names></name>
<name><surname>Qin</surname> <given-names>Y. Q.</given-names></name>
<name><surname>Feng</surname> <given-names>G. D.</given-names></name>
<name><surname>Zhou</surname> <given-names>Y.</given-names></name>
<name><surname>Zhu</surname> <given-names>H. H.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Cooperation of arbuscular mycorrhizal fungi and bacteria to facilitate the host plant growth dependent on soil pH</article-title>. <source>Front. Microbiol.</source> <volume>14</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2023.1116943</pub-id>, PMID: <pub-id pub-id-type="pmid">36891386</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fritz</surname> <given-names>C.</given-names></name>
<name><surname>Palacios-Rojas</surname> <given-names>N.</given-names></name>
<name><surname>Feil</surname> <given-names>R.</given-names></name>
<name><surname>Stitt</surname> <given-names>M.</given-names></name>
</person-group> (<year>2006</year>). 
<article-title>Regulation of secondary metabolism by the carbon&#x2013;nitrogen status in tobacco: nitrate inhibits large sectors of phenylpropanoid metabolism</article-title>. <source>Plant J.</source> <volume>46</volume>, <fpage>533</fpage>&#x2013;<lpage>548</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1365-313X.2006.02715.x</pub-id>, PMID: <pub-id pub-id-type="pmid">16640592</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gao</surname> <given-names>Z. T.</given-names></name>
<name><surname>Fu</surname> <given-names>G. M.</given-names></name>
<name><surname>Wang</surname> <given-names>H. Y.</given-names></name>
<name><surname>Wei</surname> <given-names>F. J.</given-names></name>
<name><surname>Chang</surname> <given-names>J. B.</given-names></name>
<name><surname>Yang</surname> <given-names>J. X.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Comparative analysis of volatile components in tobacco leaves with different oil levels based on TD-GC-MS</article-title>. <source>Jiangsu Agric. Sci.</source> <volume>53</volume>, <fpage>233</fpage>&#x2013;<lpage>240</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.15889/j.issn.1002-1302.2025.13.030</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gruber</surname> <given-names>N.</given-names></name>
<name><surname>Galloway</surname> <given-names>J.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>An earth-system perspective of the global nitrogen cycle</article-title>. <source>Nature.</source> <volume>451</volume>, <fpage>293</fpage>&#x2013;<lpage>296</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature06592</pub-id>, PMID: <pub-id pub-id-type="pmid">18202647</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>He</surname> <given-names>S. M.</given-names></name>
<name><surname>Zhu</surname> <given-names>G. M.</given-names></name>
<name><surname>Zhou</surname> <given-names>Y.</given-names></name>
<name><surname>Yang</surname> <given-names>B.</given-names></name>
<name><surname>Wang</surname> <given-names>J. P.</given-names></name>
<name><surname>Wang</surname> <given-names>Z. X.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Predictive models for personalized precision medical intervention in spontaneous regression stages of cervical precancerous lesions</article-title>. <source>J. Transl. Med.</source> <volume>22</volume>, <fpage>686</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12967-024-05417-y</pub-id>, PMID: <pub-id pub-id-type="pmid">39061062</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Jiang</surname> <given-names>W. H.</given-names></name>
<name><surname>Sun</surname> <given-names>Z. J.</given-names></name>
<name><surname>Li</surname> <given-names>H. Y.</given-names></name>
<name><surname>Liang</surname> <given-names>Y. X.</given-names></name>
<name><surname>Yang</surname> <given-names>Q. H.</given-names></name>
<name><surname>Yang</surname> <given-names>X.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Effects of different selenium fertilizer types and dosages on non-volatile organic acids and aroma substances of flue-cured tobacco</article-title>. <source>Front. Plant Sci.</source> <volume>16</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2025.1659004</pub-id>, PMID: <pub-id pub-id-type="pmid">40918963</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kitajima-Koga</surname> <given-names>A.</given-names></name>
<name><surname>Baslam</surname> <given-names>M.</given-names></name>
<name><surname>Hamada</surname> <given-names>Y.</given-names></name>
<name><surname>Ito</surname> <given-names>N.</given-names></name>
<name><surname>Taniuchi</surname> <given-names>T.</given-names></name>
<name><surname>Takamatsu</surname> <given-names>T.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>Functional analysis of rice long-chain acyl-CoA synthetase 9 (OsLACS9) in the chloroplast envelope membrane</article-title>. <source>Int. J. Mol. Sci.</source> <volume>21</volume>, <elocation-id>2223</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms21062223</pub-id>, PMID: <pub-id pub-id-type="pmid">32210132</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>Z. H.</given-names></name>
<name><surname>Liu</surname> <given-names>D. Q.</given-names></name>
<name><surname>Han</surname> <given-names>Z. M.</given-names></name>
<name><surname>Zhou</surname> <given-names>H. L.</given-names></name>
<name><surname>Huang</surname> <given-names>G.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>Preliminary study on the relationship between oil in flue-cured tobacco and physical and chemical property in tobacco leaves</article-title>. <source>J. Anhui Agric. Sci.</source> <volume>36</volume>, <fpage>1088</fpage>&#x2013;<lpage>1089</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.13989/j.cnki.0517-6611.2008.03.059</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li-Beisson</surname> <given-names>Y.</given-names></name>
<name><surname>Shorrosh</surname> <given-names>B.</given-names></name>
<name><surname>Beisson</surname> <given-names>F.</given-names></name>
<name><surname>Andersson</surname> <given-names>M. X.</given-names></name>
<name><surname>Arondel</surname> <given-names>V.</given-names></name>
<name><surname>Bates</surname> <given-names>P. D.</given-names></name>
<etal/>
</person-group>. (<year>2010</year>). 
<article-title>Acyl-lipid metabolism</article-title>. <source>Arabidopsis Book.</source> <volume>11</volume>, <fpage>e0161</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1199/tab.0161</pub-id>, PMID: <pub-id pub-id-type="pmid">23505340</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lu</surname> <given-names>W. D.</given-names></name>
<name><surname>Hao</surname> <given-names>Z. Q.</given-names></name>
<name><surname>Ma</surname> <given-names>X. L.</given-names></name>
<name><surname>Gao</surname> <given-names>J. L.</given-names></name>
<name><surname>Fan</surname> <given-names>X. Q.</given-names></name>
<name><surname>Guo</surname> <given-names>J. F.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Effects of different proportions of organic fertilizer replacing chemical fertilizer on soil nutrients and fertilizer utilization in gray desert soil</article-title>. <source>Agronomy.</source> <volume>14</volume>, <elocation-id>228</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/agronomy14010228</pub-id>, PMID: <pub-id pub-id-type="pmid">41725453</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ogden</surname> <given-names>M.</given-names></name>
<name><surname>Hoefgen</surname> <given-names>R.</given-names></name>
<name><surname>Roessner</surname> <given-names>U.</given-names></name>
<name><surname>Persson</surname> <given-names>S.</given-names></name>
<name><surname>Khan</surname> <given-names>G. A.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>Feeding the walls: how does nutrient availability regulate cell wall composition</article-title>? <source>Int. J. Mol. Sci.</source> <volume>19</volume>, <fpage>2691</fpage>.
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Paramesh</surname> <given-names>V.</given-names></name>
<name><surname>Kumar</surname> <given-names>R. M.</given-names></name>
<name><surname>Rajanna</surname> <given-names>G. A.</given-names></name>
<name><surname>Gowda</surname> <given-names>S.</given-names></name>
<name><surname>Nath</surname> <given-names>A. J.</given-names></name>
<name><surname>Madival</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Integrated nutrient management for improving crop yields, soil properties, and reducing greenhouse gas emissions</article-title>. <source>Front. Sustain. Food Syst.</source> <volume>7</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fsufs.2023.1173258</pub-id>, PMID: <pub-id pub-id-type="pmid">41738048</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Philippe</surname> <given-names>G.</given-names></name>
<name><surname>Bellis</surname> <given-names>D. D.</given-names></name>
<name><surname>Rose</surname> <given-names>J. K. C.</given-names></name>
<name><surname>Nawrath</surname> <given-names>C.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Trafficking processes and secretion pathways underlying the formation of plant cuticles</article-title>. <source>Front. Plant Sci.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2021.786874</pub-id>, PMID: <pub-id pub-id-type="pmid">35069645</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Poltronieri</surname> <given-names>P.</given-names></name>
<name><surname>D&#x2019;Urso</surname> <given-names>O. F.</given-names></name>
</person-group> (<year>2006</year>). &#x201c;
<article-title>Chapter 6 - Tobacco seed oil for biofuels</article-title>,&#x201d; in <source>Biotransformation of agricultural waste and by-products: the food, feed, fibre, fuel (4F) economy</source> (<publisher-loc>Amsterdam</publisher-loc>: 
<publisher-name>Elsevier Inc</publisher-name>). doi:&#xa0;<pub-id pub-id-type="doi">10.1016/B978-0-12-803622-8.00006-9</pub-id>, PMID: <pub-id pub-id-type="pmid">41737640</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Qiu</surname> <given-names>L. J.</given-names></name>
<name><surname>Li</surname> <given-names>L.</given-names></name>
<name><surname>Zhang</surname> <given-names>X.</given-names></name>
<name><surname>Suo</surname> <given-names>Y. Y.</given-names></name>
<name><surname>Chen</surname> <given-names>Q. L.</given-names></name>
<name><surname>Li</surname> <given-names>Q.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>Effects of dosage and ratio of organic and inorganic nitrogen fertilizers on soil biological characteristics and quality of tobacco leaves</article-title>. <source>Chin. J. Soil Sci.</source> <volume>51</volume>, <fpage>920</fpage>&#x2013;<lpage>927</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.19336/j.cnki.trtb.2020.04.22</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Qu</surname> <given-names>Y. F.</given-names></name>
<name><surname>Xu</surname> <given-names>M. L.</given-names></name>
<name><surname>Cao</surname> <given-names>J. M.</given-names></name>
<name><surname>Sun</surname> <given-names>H. Q.</given-names></name>
<name><surname>You</surname> <given-names>X. W.</given-names></name>
<name><surname>Wang</surname> <given-names>G. P.</given-names></name>
<etal/>
</person-group>. (<year>2018</year>). 
<article-title>Differential analysis of major glandular trichome secretion between different tobacco genotypes</article-title>. <source>Acta Tab. Sin.</source> <volume>24</volume>, <fpage>45</fpage>&#x2013;<lpage>52</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.16472/j.Chinatobacco.2017.096</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Seifert</surname> <given-names>S.</given-names></name>
<name><surname>Gundlach</surname> <given-names>S.</given-names></name>
<name><surname>Junge</surname> <given-names>O.</given-names></name>
<name><surname>Szymczak</surname> <given-names>S.</given-names></name>
</person-group> (<year>2020</year>). 
<article-title>Integrating biological knowledge and gene expression data using pathway-guided random forests: a benchmarking study</article-title>. <source>Bioinformatics.</source> <volume>36</volume>, <fpage>4301</fpage>&#x2013;<lpage>4308</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btaa483</pub-id>, PMID: <pub-id pub-id-type="pmid">32399562</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shang</surname> <given-names>L. R.</given-names></name>
<name><surname>Wan</surname> <given-names>L. Q.</given-names></name>
<name><surname>Zhou</surname> <given-names>X. X.</given-names></name>
<name><surname>Li</surname> <given-names>S.</given-names></name>
<name><surname>Li</surname> <given-names>X. L.</given-names></name>
</person-group> (<year>2020</year>). 
<article-title>Effects of organic fertilizer on soil nutrient status, enzyme activity, and bacterial community diversity in Leymus chinensis steppe in Inner Mongolia, China</article-title>. <source>PloS One</source> <volume>15</volume>, <fpage>e0240559</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0240559</pub-id>, PMID: <pub-id pub-id-type="pmid">33057441</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shi</surname> <given-names>Y. W.</given-names></name>
<name><surname>Niu</surname> <given-names>X. X.</given-names></name>
<name><surname>Chen</surname> <given-names>B. Z.</given-names></name>
<name><surname>Pu</surname> <given-names>S. H.</given-names></name>
<name><surname>Ma</surname> <given-names>H. H.</given-names></name>
<name><surname>Li</surname> <given-names>P.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>). Chemical fertilizer reduction combined with organic fertilizer affects the soil microbial community and diversity and yield of cotton</article-title>. <source>Front. Microbiol.</source> <volume>14</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2023.1295722</pub-id>, PMID: <pub-id pub-id-type="pmid">38053554</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shorten</surname> <given-names>C.</given-names></name>
<name><surname>Khoshgoftaar</surname> <given-names>T. M.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>A survey on image data augmentation for deep learning</article-title>. <source>J. Big Data.</source> <volume>6</volume>, <fpage>60</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s40537-019-0197-0</pub-id>, PMID: <pub-id pub-id-type="pmid">41731623</pub-id>
</mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Swamy</surname> <given-names>S. V.</given-names></name>
<name><surname>Kunar</surname> <given-names>B. M.</given-names></name>
<name><surname>Chandar</surname> <given-names>K. R.</given-names></name>
<name><surname>Alwetaishi</surname> <given-names>M.</given-names></name>
<name><surname>Krishnan</surname> <given-names>S.</given-names></name>
<name><surname>Reddy</surname> <given-names>S.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>Prediction of uniaxial compressive strength of limestone from ball mill grinding characteristics using supervised machine learning techniques</article-title>. <source>Sci. Rep.</source> <volume>15</volume>, <fpage>28395</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-025-09063-2</pub-id>, PMID: <pub-id pub-id-type="pmid">40759664</pub-id>
</mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Torres-Rodr&#xed;guez</surname> <given-names>J. V.</given-names></name>
<name><surname>Salazar-Vidal</surname> <given-names>M. N.</given-names></name>
<name><surname>Ch&#xe1;vez Montes</surname> <given-names>R. A.</given-names></name>
<name><surname>Massange-S&#xe1;nchez</surname> <given-names>J. A.</given-names></name>
<name><surname>Stewart Gillmor</surname> <given-names>C.</given-names></name>
<name><surname>Sawers</surname> <given-names>B. J. H.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Low nitrogen availability inhibits the phosphorus starvation response in maize (Zea mays ssp. mays L.)</article-title>. <source>BMC Plant Biol.</source> <volume>21</volume>, <fpage>259</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12870-021-02997-5</pub-id>, PMID: <pub-id pub-id-type="pmid">34090337</pub-id>
</mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>G. D.</given-names></name>
</person-group> (<year>2014</year>). 
<article-title>Recent progress in secondary metabolism of plant glandular trichomes</article-title>. <source>Plant Biotechnol.</source> <volume>31</volume>, <fpage>353</fpage>&#x2013;<lpage>361</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5511/plantbiotechnology.14.0701a</pub-id>
</mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>S. N.</given-names></name>
<name><surname>Cheng</surname> <given-names>J. K.</given-names></name>
<name><surname>Liao</surname> <given-names>Y. C.</given-names></name>
</person-group> (<year>2020</year>). 
<article-title>Fertilization model for flue-cured tobacco (nicotiana tabacum l.) in southwest China</article-title>. <source>Appl. Ecol. Environ. Res.</source> <volume>18</volume>, <fpage>7853</fpage>&#x2013;<lpage>7863</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.15666/aeer/1806_78537863</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>Z. J.</given-names></name>
<name><surname>Li</surname> <given-names>X. J.</given-names></name>
<name><surname>Yang</surname> <given-names>Y. F.</given-names></name>
<name><surname>Sun</surname> <given-names>J. P.</given-names></name>
<name><surname>Yang</surname> <given-names>X. L.</given-names></name>
<name><surname>Tian</surname> <given-names>T.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Creation and trait analysis of &#x2018;Y2001&#x2019;, a high secretory line of &#x2018;Zhongyan100&#x2019;</article-title>. <source>Mol. Plant Breed.</source> <volume>2022</volume>. Available online at: <uri xlink:href="https://kns.cnki.net/kcms/detail/46.1068.S.20220916.1111.020.html">https://kns.cnki.net/kcms/detail/46.1068.S.20220916.1111.020.html</uri> (Accessed <date-in-citation content-type="access-date">March 11, 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Xavier</surname> <given-names>M.</given-names></name>
<name><surname>Wilfried</surname> <given-names>T.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>Comparing niche- and process-based models to reduce prediction uncertainty in species range shifts under climate change</article-title>. <source>Ecology.</source> <volume>90</volume>, <fpage>1301</fpage>&#x2013;<lpage>1313</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1890/08-0134.1</pub-id>, PMID: <pub-id pub-id-type="pmid">19537550</pub-id>
</mixed-citation>
</ref>
<ref id="B40">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yan</surname> <given-names>S.</given-names></name>
<name><surname>Wang</surname> <given-names>P.</given-names></name>
<name><surname>Cai</surname> <given-names>X. J.</given-names></name>
<name><surname>Wang</surname> <given-names>C. L.</given-names></name>
<name><surname>Zwieten</surname> <given-names>L. V.</given-names></name>
<name><surname>Wang</surname> <given-names>H. L.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Biochar-based fertilizer enhanced tobacco yield and quality by improving soil quality and soil microbial community</article-title>. <source>Environ. Technol. Innov.</source> <volume>37</volume>, <elocation-id>103964</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eti.2024.103964</pub-id>, PMID: <pub-id pub-id-type="pmid">41737640</pub-id>
</mixed-citation>
</ref>
<ref id="B41">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yang</surname> <given-names>J. H.</given-names></name>
<name><surname>Mattoo</surname> <given-names>A. K.</given-names></name>
<name><surname>Liu</surname> <given-names>Y.</given-names></name>
<name><surname>Zvomuya</surname> <given-names>F.</given-names></name>
<name><surname>He.</surname> <given-names>L.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Trade-offs of organic and organic-inorganic fertilizer combinations in tomato quality and yield: A global meta-analysis, (1992&#x2013;2021)</article-title>. <source>Eur. J. Agron.</source> <volume>151</volume>, <elocation-id>126985</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eja.2023.126985</pub-id>, PMID: <pub-id pub-id-type="pmid">41737640</pub-id>
</mixed-citation>
</ref>
<ref id="B42">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zeng</surname> <given-names>W. B.</given-names></name>
<name><surname>Xie</surname> <given-names>B. L.</given-names></name>
<name><surname>Chen</surname> <given-names>Y. Z.</given-names></name>
<name><surname>Chen</surname> <given-names>J. Z.</given-names></name>
<name><surname>Li</surname> <given-names>P. W.</given-names></name>
<name><surname>Jiang</surname> <given-names>L. J.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Regulatory mechanism of carbohydrate metabolism pathways on oil biosynthesis of oil plant Symplocos paniculata</article-title>. <source>Front. Plant Sci.</source> <volume>16</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2025.1452533</pub-id>, PMID: <pub-id pub-id-type="pmid">39980488</pub-id>
</mixed-citation>
</ref>
<ref id="B43">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>S. F.</given-names></name>
<name><surname>Zhang</surname> <given-names>D. K.</given-names></name>
<name><surname>Sun</surname> <given-names>W.</given-names></name>
<name><surname>Zhang</surname> <given-names>D. D.</given-names></name>
<name><surname>Cai</surname> <given-names>Y. M.</given-names></name>
<name><surname>Geng</surname> <given-names>H. M.</given-names></name>
<etal/>
</person-group>. (<year>2021</year>). 
<article-title>Effect of mechanics characteristics of different flavor styles on appearance quality of flue-cured tobacco</article-title>. <source>J. Henan Agric. Sci.</source> <volume>50</volume>, <fpage>58</fpage>&#x2013;<lpage>65</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.15933/j.cnki.1004-3268.2021.02.007</pub-id>
</mixed-citation>
</ref>
<ref id="B44">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhou</surname> <given-names>T. Y.</given-names></name>
<name><surname>Cui</surname> <given-names>R. L.</given-names></name>
<name><surname>Shu</surname> <given-names>C. C.</given-names></name>
<name><surname>Zhu</surname> <given-names>K. Y.</given-names></name>
<name><surname>Zhang</surname> <given-names>W. Y.</given-names></name>
<name><surname>Zhang</surname> <given-names>H.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Combining urea and controlled release nitrogen fertilizer to enhance lodging resistance of rice (Oryza sativa L.) by altering accumulation of silicon and cell wall polymers at high yielding levels</article-title>. <source>Field Crops Res.</source> <volume>315</volume>, <elocation-id>109459</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.fcr.2024.109459</pub-id>, PMID: <pub-id pub-id-type="pmid">41737640</pub-id>
</mixed-citation>
</ref>
<ref id="B45">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhou</surname> <given-names>M.</given-names></name>
<name><surname>Zhang</surname> <given-names>Y.</given-names></name>
<name><surname>Yang</surname> <given-names>J.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Analysis of nitrogen dynamics and transcriptomic activity revealed a pivotal role of some amino acid transporters in nitrogen remobilization in poplar senescing leaves</article-title>. <source>Plants.</source> <volume>12</volume>, <elocation-id>4140</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/plants12244140</pub-id>, PMID: <pub-id pub-id-type="pmid">38140467</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/338990">Nirit Bernstein</ext-link>, Agricultural Research Organization (ARO), Israel</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2963173">Chaosheng Luo</ext-link>, Yunnan Agricultural University, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3011966">Khairul Azree Rosli</ext-link>, Independent Researcher, Malaysia</p></fn>
</fn-group>
</back>
</article>