<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2026.1767299</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Genome-wide detection of superior haplotypes for seed oil and protein content in Northeast China soybean (<italic>Glycine max</italic> L.) germplasm</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Bu</surname><given-names>Moran</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3313529/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname><given-names>Ye</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Xu</surname><given-names>Weitao</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname><given-names>Yanhua</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Yu</surname><given-names>Hui</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1345381/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname><given-names>Yaohua</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/383931/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname><given-names>Suxin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/530228/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Bhat</surname><given-names>Javaid Akhter</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/367199/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Feng</surname><given-names>Xianzhong</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/384174/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Key Laboratory of Soybean Molecular Design Breeding, Northeast Institute of Geography and Agroecology, Chinese Academy of Sciences</institution>, <city>Changchun</city>, <state>Jilin</state>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>College of Advanced Agricultural Sciences, University of Chinese Academy of Sciences</institution>, <city>Beijing</city>,&#xa0;<country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Xianzhong Feng, <email xlink:href="mailto:fengxianzhong@iga.ac.cn">fengxianzhong@iga.ac.cn</email>; Javaid Akhter Bhat, <email xlink:href="mailto:javid.akhter69@gmail.com">javid.akhter69@gmail.com</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-24">
<day>24</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>17</volume>
<elocation-id>1767299</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>26</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>24</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Bu, Zhang, Xu, Li, Yu, Zhang, Yang, Bhat and Feng.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Bu, Zhang, Xu, Li, Yu, Zhang, Yang, Bhat and Feng</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-24">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Seed oil content (SOC) and seed protein content (SPC) are the crucial traits determining the economic importance of soybeans. However, the molecular mechanism underlying the high SOC and low SPC of Northeast China soybeans is still limited. To address this, we elucidated the genetic basis of SOC and SPC in soybean germplasm adapted to Northeast China by employing an integrated genomic analysis. The genome-wide association study (GWAS) detected 105 and 59 significant SNPs associated with the SOC and SPC, respectively across four environments plus combined environment (CE). The haplotype allele number in the 15 identified haplotype blocks varied from 2&#x2013;4 regulating the SOC and SPC in the range of 16.68-21.15% and 38.63-42.69%, respectively. Five quantitative trait loci (QTLs) among the total 17 identified QTLs were novel that include <italic>qSOC1</italic>, <italic>qSPC1</italic>, <italic>qSOC9</italic>, <italic>qSOC_SPC15.1</italic> and <italic>qSOC_SPC15.2</italic> associated with SOC or/and SPC. Based on the <italic>in-silico</italic>, variant annotation and haplotype analysis, the 80 genes were prioritized as potential candidates. The haplotype alleles of these genes varied from 2&#x2013;8 regulating SOC and SPC in the range of 15.98-21.23% and 37.69%-43.30%, respectively. Twelve of 80 genes showed distinct selection signatures between the two populations, suggesting their key roles in shaping the specific seed quality profiles of soybean germplasm in Northeast China. Hence, the current study provides novel insights on divergent breeding influencing the local adaptation and seed quality difference between different regional soybean populations. Besides, the stable QTLs, superior haplotypes and candidate genes identified can be used for soybean improvement.</p>
</abstract>
<kwd-group>
<kwd>GWAS</kwd>
<kwd>haplotype</kwd>
<kwd>Northeast China</kwd>
<kwd>oil content</kwd>
<kwd>protein content</kwd>
<kwd>soybean</kwd>
</kwd-group>
<funding-group>
<award-group id="gs1">
<funding-source id="sp1">
<institution-wrap>
<institution>National Major Science and Technology Projects of China</institution>
<institution-id institution-id-type="doi" vocab="open-funder-registry" vocab-identifier="10.13039/open_funder_registry">10.13039/501100013076</institution-id>
</institution-wrap>
</funding-source>
</award-group>
<award-group id="gs2">
<funding-source id="sp2">
<institution-wrap>
<institution>National Natural Science Foundation of China</institution>
<institution-id institution-id-type="doi" vocab="open-funder-registry" vocab-identifier="10.13039/open_funder_registry">10.13039/501100001809</institution-id>
</institution-wrap>
</funding-source>
<award-id rid="sp2">32488102, U21A20215</award-id>
</award-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This research was supported by Sanjiang Laboratory (SJ2025003), Biological Breeding&#x2013;National Science and Technology Major Project of China (2023ZD04032), the National Natural Science Foundation of China (32488102 &amp; U21A20215) and Key project of Jilin Province (2025JLGJ0009NC).</funding-statement>
</funding-group>
<counts>
<fig-count count="9"/>
<table-count count="2"/>
<equation-count count="1"/>
<ref-count count="101"/>
<page-count count="22"/>
<word-count count="12323"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Functional and Applied Plant Genomics</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Soybean possesses high nutritional significance as their seeds have high content of oil and protein; and the average seed oil content (SOC) and seed protein content (SPC) in soybean is 20% and 40%, respectively (<xref ref-type="bibr" rid="B21">Guo et&#xa0;al., 2022</xref>). These features make the soybean as the fifth major crop in the world production, and is cultivated globally (<xref ref-type="bibr" rid="B29">Karges et&#xa0;al., 2022</xref>). Soybean oil is consumed by humans as well as used for industrial applications; besides, soybeans provide plant proteins to humans and livestock&#x2019;s; hence, the improvement of the SOC and SPC has central importance in the soybean breeding program (<xref ref-type="bibr" rid="B47">Majidian et&#xa0;al., 2024</xref>). Although, conventional breeding has made considerable efforts in the development of soybean cultivars with high SOC, these achievements have been made at the cost of reducing the SPC and vice versa (<xref ref-type="bibr" rid="B39">Li et&#xa0;al., 2019</xref>). The significant strong negative correlation between SOC and SPC has made it difficult for the conventional breeding to simultaneously improve these both traits in the same soybean cultivar (<xref ref-type="bibr" rid="B54">Mo et&#xa0;al., 2024</xref>). In this context, the molecular breeding can allow the simultaneous improvement of SOC and SPC in the same cultivar by using the independent or non-correlated MTAs (marker-trait associations)/QTLs (quantitative trait loci)/genes (<xref ref-type="bibr" rid="B58">Nair and Rabbani, 2024</xref>). However, molecular breeding requires the elucidation of detailed genetic architecture for these traits. Identifying and confirming the independent genetic loci associated with the SOC and SPC will allow the development of soybean cultivars with high seed oil and protein content; that in turn will increase the economic value and consumer acceptance of the soybeans.</p>
<p>Although, substantial attempts have been made in the past to detect the genetic elements associated with SOC and SPC traits in soybean; to this end, ~330 and 250 QTLs linked with SOC and SPC, respectively are deposited in the SoyBase (<ext-link ext-link-type="uri" xlink:href="http://www.soybase.org">http://www.soybase.org</ext-link>). Mostly the classical approach of linkage mapping involving the use of biparental population which possesses the lower number of recent recombination events has been utilized for the detection of these QTLs, thus has the limitation of low-resolution and larger confidence interval (<xref ref-type="bibr" rid="B6">Capilla-P&#xe9;rez et&#xa0;al., 2024</xref>). The disadvantage of low-resolution has in turn restricted the use of these QTLs in the practical soybean breeding for the enhancement of SOC and SPC (<xref ref-type="bibr" rid="B30">Karikari et&#xa0;al., 2019</xref>). In this context, the association mapping approach has the benefits of higher resolution and precision because it uses the diverse natural population that has undergone recombination over thousands to millions of years, thus has emerged as a more realistic method for molecular breeding applications (<xref ref-type="bibr" rid="B35">Leventhal et&#xa0;al., 2025</xref>). There are multiple studies in which the association mapping/GWAS (genome-wide association study) has been used for the SOC and SPC traits in soybean; and majority of these studies were performed in low-latitude regions. For example, <xref ref-type="bibr" rid="B39">Li et&#xa0;al. (2019)</xref> performed the association mapping for SOC and SPC traits by using 185 diverse accessions of soybean that were genotyping with SLAF-seq technology; and they identified 31 MTAs linked with SOC and SPC distributed on the 12 out of total 20 soybean chromosomes. Similarly, <xref ref-type="bibr" rid="B34">Lee et&#xa0;al. (2019)</xref> used the 621 diverse accessions of soybean in the GWAS analysis of SOC and SPC, and this panel was genotyping using SoySNP50K array; and they detected 19 and 16 significant MTAs linked with the SOC and SPC, respectively. <xref ref-type="bibr" rid="B8">Chen et&#xa0;al. (2025)</xref> used the nested-association population (NAM) of 1107 soybean accessions genotyping with SoySNP50K array, and they detected 104 and 99 MTAs associated with SOC and SPC, respectively. Moreover, <xref ref-type="bibr" rid="B15">Doszhanova et&#xa0;al. (2024)</xref> used 252 diverse soybean accessions genotyping with whole genome resequencing (WGRS), and they identified nine and nine MTAs linked with the SOC and SPC, respectively. There are some other studies that have used the GWAS for SOC and SPC traits in low-latitude regions (<xref ref-type="bibr" rid="B24">He et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B31">Kim et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B89">Yuan et&#xa0;al., 2024</xref>; <xref ref-type="bibr" rid="B60">Patel et&#xa0;al., 2025</xref>). However, some studies of GWAS have been carried out for SOC and SPC for soybeans in high-latitude regions. For instance, <xref ref-type="bibr" rid="B94">Zhang et&#xa0;al. (2025)</xref> have used the four-way recombinant inbred line (FW-RIL) populations for GWAS of SPC, and they have identified 18 MTAs linked with SPC.</p>
<p>The SOC and SPC being the complex traits are regulated by numerous genes, and limited attempts have been made to identify the actual genes governing the SOC and SPC in soybean. Hence, there is a need to detect actual genes governing these traits in soybean. Genes such as <italic>GmSWEET10</italic>, <italic>GmOLEO1</italic> and <italic>GmST05/GmMFT</italic> regulate the SOC positively, but they regulate the SPC negatively (<xref ref-type="bibr" rid="B97">Zhang et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B79">Wang et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B56">Mukherjee et&#xa0;al., 2023</xref>). In contrast, the genes such as <italic>POWR1-TE</italic>, <italic>GmJAZ3</italic> and <italic>GmSDP1</italic> positively regulate the SPC but negatively regulate SOC (as reviewed by <xref ref-type="bibr" rid="B54">Mo et&#xa0;al. (2024)</xref>). The <italic>GmSop20</italic> has been reported to serve as a key gene regulating the SOC/SPC ratio in soybean (<xref ref-type="bibr" rid="B99">Zheng et&#xa0;al., 2025</xref>). Moreover, the <italic>ST1</italic> gene has been documented to regulate SOC in soybean (<xref ref-type="bibr" rid="B38">Li et&#xa0;al., 2022</xref>). The biosynthesis of fatty acids and amino acids are significantly determined by the allocation of the nitrogen and carbon sources, and breakdown of carbohydrate substances are the major source for providing the materials in the synthesis of oil and protein. The <italic>GmSWEET10</italic> (<italic>Glyma.15G049200</italic>) is a sugar transporter gene that controls the SOC and SPC accumulation (<xref ref-type="bibr" rid="B79">Wang et&#xa0;al., 2020</xref>). Besides, the SPC of soybean is regulated by other proteins such as GTPase (encoded by <italic>GmRab5a</italic>), guanyl-nucleotide releasing factors and methionine lyase (<xref ref-type="bibr" rid="B83">Wei et&#xa0;al., 2019</xref>). Hence, substantial attempts are required to detect the genes regulating SOC and SPC in soybean.</p>
<p>In the past, association mapping has predominantly utilized the biallelic single nucleotide polymorphism (SNP) markers, which has greatly decreased the efficiency of GWAS because it can capture only two alleles in the diverse soybean germplasm. But there are multiple alleles of the genetic loci or gene across the diverse soybean panel, which might be rare and superior, and go uncaptured (<xref ref-type="bibr" rid="B43">Liu et&#xa0;al., 2025</xref>). In this context multiallelic haplotype markers can overcome these challenges; and the better performance of haplotype markers relative to the SNP markers are documented through both empirical and simulation methods (<xref ref-type="bibr" rid="B88">Yu et&#xa0;al., 2024</xref>). The superior and rare haplotypes are reported for various agronomic traits in rice (<xref ref-type="bibr" rid="B1">Abbai et&#xa0;al., 2019</xref>) and stress tolerance in rice and pigeonpea (<xref ref-type="bibr" rid="B32">Kuroha et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B70">Sinha et&#xa0;al., 2020</xref>). In soybean, the superior haplotypes are detected for plant height, yield-related traits and branch number (<xref ref-type="bibr" rid="B40">Liang et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B69">Shao et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B65">Qin et&#xa0;al., 2023</xref>). However, almost no efforts have been made in the detection of superior haplotypes for SOC and SPC traits in soybean. Hence, there is a need to identify these genetic elements for these traits in soybean.</p>
<p>It has been documented that SOC and SPC exhibit a significant latitudinal gradient (<xref ref-type="bibr" rid="B21">Guo et&#xa0;al., 2022</xref>). The SOC has direct relationship with the latitude i.e., SOC increases with the latitude in soybean; in contrast, SPC is negatively correlated with latitude (<xref ref-type="bibr" rid="B68">Rotundo et&#xa0;al., 2016</xref>). For example, it has been documented that SOC and SPC are low and high, respectively, in the soybeans grown in the Southern US relative to those cultivated in Northern US (<xref ref-type="bibr" rid="B68">Rotundo et&#xa0;al., 2016</xref>). In China, the SOC and SPC are high and low, respectively in the soybeans cultivated in Northeast China compared to those grown in Huanghuaihai region and southern parts of China (<xref ref-type="bibr" rid="B72">Song et&#xa0;al., 2023</xref>). The varied environmental conditions across the different latitudes significantly affect the SOC and SPC in soybeans. The cool weather and long-day conditions are favorable for oil biosynthesis, while warm weather and short-day conditions are favorable for protein accumulation (<xref ref-type="bibr" rid="B27">Kalantar Ahmadi and Sarhangi, 2025</xref>). In addition, delayed sowing may result in a decrease of SPC, which is the important reason in the high-latitude regions (<xref ref-type="bibr" rid="B90">Zelaya Arce et&#xa0;al., 2025</xref>). In total, the environmental factors in high-latitude regions such as lower temperature, reduced growth season and environmental stress factors enforce the soybean plants to biosynthesis and accumulate more SOC relative to SPC as a strategy for adaptation. This can be explained as, in the high-latitude regions of Northeast China, the temperature is low at the sowing time and maturity time; hence, presence of the high SOC rich in unsaturated fatty acids can allow the normal germination of the soybean seeds as well as the survival of the seeds at maturity time. Because the oil can be in liquid form and not frozen at the low temperature, thus will be the most suitable source of energy in the high-latitudes during the seed germination (<xref ref-type="bibr" rid="B100">Zhou et&#xa0;al., 2025</xref>). Hence, the soybeans adapted to Northeast China/high-latitudes have genetic adaptations that favor oil production, as this could improve the plant&#x2019;s ability to endure harsh climates. This could come at the cost of protein content, which may be less of a priority for the plant in extreme conditions.</p>
<p>Here, we utilized a diverse collection of soybean accessions adapted to the Northeast region of China to investigate the genetic basis of SOC and SPC. To achieve this, we employed a combined strategy that integrated association mapping, haplotype analysis, QTL analysis and candidate gene analysis. The results of our investigation revealed significant SNPs, superior haplotypes, stable genomic loci/QTLs and candidate genes associated with SOC and SPC in soybean. The detected SNPs, superior haplotypes, genomic loci and genes could be potentially deployed in soybean breeding programs aimed at producing soybean cultivars with both high SOC and SPC. Besides, our results revealed divergent breeding of key genes may result in local adaptation and the specific quality profile of soybeans in Northeast China.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Plant materials and field experiments</title>
<p>Here, a set of 340 diverse accessions of soybean derived from the different growing regions of China were used as plant material (<xref ref-type="supplementary-material" rid="SF9"><bold>Supplementary Table S1</bold></xref>). These soybean accessions were planted under natural conditions at two separate locations of the Jilin province viz., Changchun (CC) and Jiutai (JT). In the CC location, the accessions were grown in the experimental field of the Northeast Institute of Geography and Agroecology, Chinese Academy of Sciences (44&#xb0;0&#x2019;N, 125&#xb0;24&#x2019;E), on the following dates: April 29<sup>th</sup>, 2022 (CC22); April 28<sup>th</sup>, 2023 (CC23); and April 30<sup>th</sup>, 2024 (CC24), respectively; whereas these accessions were grown on May 10<sup>th</sup>, 2024 in the experimental field of Changchun Polytechnic (44&#xb0;4&#x2019;N, 125&#xb0;40&#x2019;E, Jiutai District, Changchun), representing the environment JT24. Hence, the diverse soybean germplasm resources were accessed across the four different environments viz., CC22, CC23, CC24 &amp; JT24. The randomized complete block design (RCBD) involving three replications was used for planting this germplasm. The plot of each soybean accession was consisted of three rows with the spacing between the rows maintained at 50 cm and the length of row kept at 200 cm. At the maturity stage, the seeds of each accession were harvested in the main season of all four environments. The soybean germplasm was cultivated following the normal agronomic practices.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Phenotypic analysis of SOC and SPC</title>
<p>The seed samples collected were placed in a cup with a bottom of 5 cm in diameter, and a height of 3 cm for near-infrared spectroscopy analysis; and the seeds were analyzed without any treatment and in good condition. The cup was filled with the equivalent of about 60 ml of soybean seed (about 20 g or 80 seeds). Spectra acquisition was carried out using a Fourier transform near-infrared (FTNIR) analyzer (Antaris II spectrometer: Thermofisher Scientific, France). The SOC and SPC were expressed in percentage by weight of seeds. Phenotypic data of SOC and SPC were estimated for each accession in three replications for all four environments. The SOC and SPC were estimated in each replication, and the average of three replications was used for further analysis. The combined environment (CE) data were derived from the data of individual environments by utilizing the &#x201c;lme4&#x201d; package in R environment (<xref ref-type="bibr" rid="B4">Bates et&#xa0;al., 2015</xref>). The predicted means (best linear unbiased predictions, BLUPs) for the CE were calculated by fitting the following model:</p>
<disp-formula>
<mml:math display="block" id="M1"><mml:mrow><mml:msub><mml:mi>Y</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mo>&#xa0;</mml:mo><mml:mi>&#x3bc;</mml:mi><mml:mo>+</mml:mo><mml:msub><mml:mi>G</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>E</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mi>G</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>R</mml:mi><mml:mi>e</mml:mi><mml:msub><mml:mi>p</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x3f5;</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im1"><mml:mrow><mml:msub><mml:mi>Y</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the phenotypic value of the <italic>i</italic>-th genotype in the <italic>k</italic>-th replication of the <italic>j</italic>-th environment, <inline-formula>
<mml:math display="inline" id="im2"><mml:mi>&#x3bc;</mml:mi></mml:math></inline-formula> is the overall mean, <inline-formula>
<mml:math display="inline" id="im3"><mml:mrow><mml:msub><mml:mi>G</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the random effect of the <italic>i</italic>-th genotype, <inline-formula>
<mml:math display="inline" id="im4"><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> is the random effect of the <italic>j</italic>-th environment, <inline-formula>
<mml:math display="inline" id="im5"><mml:mrow><mml:mi>G</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the random effect of the genotype-by-environment interaction, <inline-formula>
<mml:math display="inline" id="im6"><mml:mrow><mml:mi>R</mml:mi><mml:mi>e</mml:mi><mml:msub><mml:mi>p</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow></mml:math></inline-formula> is the random effect of the block nested within the <italic>j</italic>-th environment, and <inline-formula>
<mml:math display="inline" id="im7"><mml:mrow><mml:msub><mml:mi>&#x3f5;</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math></inline-formula> is the random error. The analysis of variance (ANOVA) was calculated by utilizing the R language. The broad-sense heritability (<italic>H</italic>) was estimated as <inline-formula>
<mml:math display="inline" id="im8"><mml:mrow><mml:msubsup><mml:mi>&#x3c3;</mml:mi><mml:mi>G</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo stretchy="false">/</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msubsup><mml:mi>&#x3c3;</mml:mi><mml:mi>G</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:msubsup><mml:mi>&#x3c3;</mml:mi><mml:mrow><mml:mi>G</mml:mi><mml:mi>E</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup><mml:mo stretchy="false">/</mml:mo><mml:mi>n</mml:mi><mml:mo>+</mml:mo><mml:msubsup><mml:mi>&#x3c3;</mml:mi><mml:mi>&#x3f5;</mml:mi><mml:mn>2</mml:mn></mml:msubsup><mml:mo stretchy="false">/</mml:mo><mml:mi>n</mml:mi><mml:mi>r</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow></mml:math></inline-formula>, in which the <inline-formula>
<mml:math display="inline" id="im9"><mml:mrow><mml:msubsup><mml:mi>&#x3c3;</mml:mi><mml:mi>G</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula>, <inline-formula>
<mml:math display="inline" id="im10"><mml:mrow><mml:msubsup><mml:mi>&#x3c3;</mml:mi><mml:mrow><mml:mi>G</mml:mi><mml:mi>E</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula> and <inline-formula>
<mml:math display="inline" id="im11"><mml:mrow><mml:msubsup><mml:mi>&#x3c3;</mml:mi><mml:mi>&#x3f5;</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula> represent the genotypic variance, genotype &#xd7; environment interaction variance, and residual variance, respectively, <italic>n</italic> is the number of environments, and <italic>r</italic> is the number of replications within each environment.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Genotyping of plant materials</title>
<p>The resequencing data for the soybean accessions were obtained from our previously published study (<xref ref-type="bibr" rid="B96">Zhang et&#xa0;al., 2024b</xref>). Briefly, the genomic DNA was extracted from fresh and healthy leaf tissues of three-week-old seedlings using the cetyltrimethylammonium bromide (CTAB) method (<xref ref-type="bibr" rid="B57">Murray and Thompson, 1980</xref>). The genomic DNA was fragmented to a target size of 350 bp. Library preparation was performed by Gene Denovo Biotechnology Co., Ltd. (Guangzhou, China) sequenced on the DNBSEQ-T7 platform (BGI, Shenzhen, China) by Gene Denovo Biotechnology Co., Ltd. (Guangzhou, China). The average depth of resequencing was 25 &#xd7; and the volume of the total data produced was 8.57 Tb. The fastp software (<xref ref-type="bibr" rid="B9">Chen et&#xa0;al., 2018</xref>) was utilized to eliminate the reads with low quality, reads with &gt; 10% N content and adapter sequences; and we retained only the clean reads. The Burrows-Wheeler Aligner software (<xref ref-type="bibr" rid="B36">Li, 2013</xref>) was utilized to map the sequence reads with the reference genome of Wm82.a2.v1. The Genome Analysis Toolkit (<xref ref-type="bibr" rid="B50">McKenna et&#xa0;al., 2010</xref>) was used to identify the sequence variants such as SNPs, insertions/deletions (InDels) and other larger variants; and in this way we identified a total of 25,442,248 genetic variants. Furthermore, we utilized the stringent measures of quality control viz., missing rate greater than 10% and minor allele frequency less than 0.05, and finally detected high-quality SNPs of 3,343,372, with the mean heterozygous rate of 0.094.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Population structure and linkage disequilibrium analysis</title>
<p>The PCA result and kinship of GWAS panel were generated by GAPIT package (<xref ref-type="bibr" rid="B81">Wang and Zhang, 2021</xref>) in R environment. The PopLDdecay software v3.43 (<xref ref-type="bibr" rid="B92">Zhang et&#xa0;al., 2018a</xref>) was used for LD decay calculation with the following parameters: -MaxDist 300, -MAF 0.05, and -Miss 0.1.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Association mapping analysis</title>
<p>For association mapping analysis, the study utilized the GAPIT package (<xref ref-type="bibr" rid="B81">Wang and Zhang, 2021</xref>). Seven different GWAS models were used viz., GLM (General Linear Model), MLM (Mixed Linear Model), CMLM (Compressed Mixed Linear Model), MLMM (Multi-Locus Mixed Linear Model), SUPER (Settlement of MLM Under Progressively Exclusive Relationship), FarmCPU (Fixed and random model Circulating Probability Unification) and BLINK (Bayesian-information and Linkage-disequilibrium Iteratively Nested Keyway). The multiple models were used because various models of GWAS are built on divergent hypotheses involving different distribution characteristics of QTL effects. Among these, MLMM, BLINK, SUPER, and FarmCPU are considered multi-locus models, whereas GLM, MLM and CMLM are categorized as single-locus GWAS models. The default parameters of GAPIT were employed to detect significant SNP associations. The GAPIT package in the R program was employed for conducting principal component analysis (PCA) and kinship analysis to assess population structure (<xref ref-type="bibr" rid="B42">Lipka et&#xa0;al., 2012</xref>). To visualize population structure in R environment, we used the &#x201c;plotly&#x201d; package. A suggestive association threshold (i.e., 1/<italic>N<sub>test</sub></italic>) was set at <italic>P</italic> &lt; 2.99 &#xd7; 10<sup>-7</sup>, which reflects the level at which, under the null hypothesis, one false positive result is expected across the entire genome scan (<xref ref-type="bibr" rid="B33">Lander and Kruglyak, 1995</xref>; <xref ref-type="bibr" rid="B18">Duggal et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B80">Wang et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B37">Li et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B22">Guo et&#xa0;al., 2017</xref>). The UpSetR package was used to draw the UpSet plots (<xref ref-type="bibr" rid="B11">Conway et&#xa0;al., 2017</xref>).</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Haplotype analysis</title>
<p>To determine the level of LD between pairs of SNPs, we employed the Haploview 4.2 software (<xref ref-type="bibr" rid="B3">Barrett et&#xa0;al., 2004</xref>). A haplotype block was determined when two or more than 2 significant SNPs were present in the same chromosome, and these SNPs were present within the LD decay distance in the upstream and downstream of chromosome such as &#xb1; 71.7 kb in the present study. Pairwise means were analyzed using Fisher&#x2019;s Least Significant Difference (LSD) Test, and visualization of the results was performed in the R environment.</p>
</sec>
<sec id="s2_7">
<label>2.7</label>
<title>Candidate gene identification</title>
<p>Gene models that were present across the genomic interval of 17 QTLs along with their function annotation were collected from SoyBase (<ext-link ext-link-type="uri" xlink:href="https://www.soybase.org/">https://www.soybase.org/</ext-link>); and soybean genome version of Wm82.a2.v1 was utilized to collect the gene model information. The information about gene ontology (GO) was obtained from SoyBase (<ext-link ext-link-type="uri" xlink:href="https://www.soybase.org/">https://www.soybase.org/</ext-link>). The analysis of GO enrichment was carried out by utilizing the agriGO V2.0 (<ext-link ext-link-type="uri" xlink:href="https://systemsbiology.cau.edu.cn/agriGOv2/">https://systemsbiology.cau.edu.cn/agriGOv2/</ext-link>) tool (<xref ref-type="bibr" rid="B74">Tian et&#xa0;al., 2017</xref>). The publicly available RNA-seq data at SoyMD (<ext-link ext-link-type="uri" xlink:href="https://yanglab.hzau.edu.cn/SoyMD/#/">https://yanglab.hzau.edu.cn/SoyMD/#/</ext-link>) for different tissues/organs as well as development stages were collected for the model genes (<xref ref-type="bibr" rid="B86">Yang et&#xa0;al., 2023</xref>). The heatmap of transcriptomic data was produced by utilizing the ComplexHeatmap package of R software (<xref ref-type="bibr" rid="B20">Gu et&#xa0;al., 2016</xref>). Initial screening of the putative candidate genes was carried out using the <italic>in-silico</italic> analysis and a literature survey. The genes selected based on the initial step were further screened using the variant annotation and haplotype analysis; and the genes fulfilling the criteria of variant annotation and haplotype differences were prioritized as potential candidate genes regulating the SOC and SPC in soybean. The variant annotation was carried out by utilizing the SnpEff software (<xref ref-type="bibr" rid="B10">Cingolani et&#xa0;al., 2012</xref>).</p>
<p>The sequencing data for the haplotype selection analysis of soybean accessions adapted to different latitudes of China has been collected from SoyMD (<ext-link ext-link-type="uri" xlink:href="https://yanglab.hzau.edu.cn/SoyMD/#/">https://yanglab.hzau.edu.cn/SoyMD/#/</ext-link>). The different regions of China have been divided into China-I, China-II, China-III, China-IV, China-V and China-VI (<xref ref-type="bibr" rid="B45">Liu et&#xa0;al., 2023</xref>); China-I has the highest latitude including the Northeast China; China-II has the mid-latitude that includes Huanghuaihai regions; and China-III to China-VI include the Southern China and have low-latitude. Pairwise <italic>F<sub>ST</sub></italic> values were estimated by using the window size of 5 kb and a step size of 200 bp using VCFtools (<xref ref-type="bibr" rid="B13">Danecek et&#xa0;al., 2011</xref>). Nucleotide diversity (<italic>&#x3c0;</italic>) values within various populations were also evaluated using VCFtools (<xref ref-type="bibr" rid="B13">Danecek et&#xa0;al., 2011</xref>) with a fixed window of 5 kb and a step size of 200 bp. Tajima&#x2019;s <italic>D</italic> values were evaluated using VCF-kit (<xref ref-type="bibr" rid="B12">Cook and Andersen, 2017</xref>) with a fixed window of 5 kb and a step size of 200 bp.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Phenotypic analysis of SOC and SPC</title>
<p>The mean values of the SOC and SPC across the four different environments, viz. CC22, CC23, CC24 and JT24 are revealed in the violin plots (<xref ref-type="fig" rid="f1"><bold>Figures&#xa0;1A, B</bold></xref>; <xref ref-type="supplementary-material" rid="SF1"><bold>Supplementary Figure&#xa0;1</bold></xref>). The average values of SOC showed significant differences among the four environments; however, the average values of SOC exhibited non-significant differences between CC22 and CC23, while the remaining comparison groups of environments showed significant differences in the average values of SOC (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1A</bold></xref>). The average values of SPC revealed significant differences among the four environments, but the non-significant differences were observed between CC22 and JT24 for the SPC; while the significant differences were observed for the average values of SPC in the remaining comparison groups (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1B</bold></xref>). The frequency distributions of SOC and SPC traits in the set of 340 diverse soybean accessions across four individual environments, viz. CC22, CC23, CC24 &amp; JT24, are shown in <xref ref-type="supplementary-material" rid="SF1"><bold>Supplementary Figure&#xa0;1</bold></xref>. The scatter plots of SOC and SPC traits in CC22, CC23, CC24, JT24 environments and the CE shown in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1C</bold></xref> and the Pearson correlation coefficients between these traits in different individual environments and the CE (-0.41, -0.46, -0.41, -0.36 and -0.34, <italic>P</italic> &lt; 0.0001) underscored a consistent moderate negative correlation between SOC and SPC across different environments in our soybean population.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Comparison of trait values and correlation analysis of SOC and SPC across 340 soybean accessions. <bold>(A)</bold> Comparison of average values of the SOC across four individual environments viz., CC22, CC23, CC24 &amp; JT24 in the soybean germplasm. <bold>(B)</bold> Comparison of average values of the SPC across four individual environments viz., CC22, CC23, CC24 &amp; JT24 in the soybean germplasm. <bold>(C)</bold> Scatter plot of SOC and SPC traits in the soybean germplasm across the four individual environments (CC22, CC23, CC24 &amp; JT24) plus combined environments (CE). The different letters at the top of density curve correspond to differences at the significant level, whereas the same letters correspond to differences at the non-significant levels.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767299-g001.tif">
<alt-text content-type="machine-generated">Scientific figure with three panels: Panel A shows a violin plot comparing SOC across four environments (CC22, CC23, CC24, JT24), revealing significant differences marked by letter groupings above each plot; Panel B presents a similar violin plot for SPC across the same environments, also showing significant differences via letter groupings; Panel C displays five scatterplots, each plotting SOC against SPC for one environment (CC22, CC23, CC24, JT24, CE), all indicating a negative correlation between the two variables. A color-coded legend identifies each environment.</alt-text>
</graphic></fig>
<p>The parameters of descriptive statistics for the SOC and SPC traits in 340 soybean cultivars across four individual environments, viz. CC22, CC23, CC24 &amp; JT24 plus the CE, are presented in <xref ref-type="supplementary-material" rid="SF10"><bold>Supplementary Table S2</bold></xref>. The average values of the SOC ranged from 19.21 to 20.56% in the environments of CC23 and JT24, respectively; and the minimum and maximum values for the SOC were 13.59% and 24.67% in the environments of CC22 and JT24, respectively. The coefficients of variation (CVs) of SOC varied from 7.62 to 8.37% in the environments of JT24 and CC23, respectively; and the CV of SOC in the CE was 7.11%. The skewness of the SOC varied from -0.79 to -0.21 in the JT24 and CC23 environments, respectively; and the kurtosis of SOC ranged from 0.52 to 1.37 in the environments of CC23 and CE, respectively. Broad-sense heritability (<italic>H</italic>) for SOC was high equal to 0.86 (<xref ref-type="supplementary-material" rid="SF10"><bold>Supplementary Table S2</bold></xref>). The results of ANOVA analysis showed highly significant (<italic>P&lt;0.0001</italic>) variances of genotype (<italic>G</italic>), environment (<italic>E</italic>) and genotype &#xd7; environment (<italic>G &#xd7; E</italic>) interaction for the SOC (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Analysis of variance (ANOVA) for SOC and SPC in combined environment.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Trait</th>
<th valign="middle" align="left">Source</th>
<th valign="middle" align="left">DF</th>
<th valign="middle" align="left">SS</th>
<th valign="middle" align="left">MS</th>
<th valign="middle" align="left"><italic>F</italic> value</th>
<th valign="middle" align="left"><italic>P</italic> value (Prob&#x2009;&gt;&#x2009;<italic>F</italic>)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="5" align="left">SOC</td>
<td valign="middle" align="left">Block within <italic>E</italic></td>
<td valign="middle" align="left">10</td>
<td valign="middle" align="left">24.406</td>
<td valign="middle" align="left">2.441</td>
<td valign="middle" align="left">4.543</td>
<td valign="middle" align="left">&lt;0.0001 ***</td>
</tr>
<tr>
<td valign="middle" align="left">Genotype(<italic>G</italic>)</td>
<td valign="middle" align="left">339</td>
<td valign="middle" align="left">8975.567</td>
<td valign="middle" align="left">26.476</td>
<td valign="middle" align="left">49.286</td>
<td valign="middle" align="left">&lt;0.0001 ***</td>
</tr>
<tr>
<td valign="middle" align="left">Environment(<italic>E</italic>)</td>
<td valign="middle" align="left">3</td>
<td valign="middle" align="left">1161.514</td>
<td valign="middle" align="left">387.171</td>
<td valign="middle" align="left">720.719</td>
<td valign="middle" align="left">&lt;0.0001 ***</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>G</italic> &#xd7; <italic>E</italic></td>
<td valign="middle" align="left">1017</td>
<td valign="middle" align="left">2413.120</td>
<td valign="middle" align="left">2.373</td>
<td valign="middle" align="left">4.417</td>
<td valign="middle" align="left">&lt;0.0001 ***</td>
</tr>
<tr>
<td valign="middle" align="left">Residuals</td>
<td valign="middle" align="left">3201</td>
<td valign="middle" align="left">1719.582</td>
<td valign="middle" align="left">0.537</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" rowspan="5" align="left">SPC</td>
<td valign="middle" align="left">Block within <italic>E</italic></td>
<td valign="middle" align="left">10</td>
<td valign="middle" align="left">51.188</td>
<td valign="middle" align="left">5.119</td>
<td valign="middle" align="left">3.763</td>
<td valign="middle" align="left">&lt;0.0001 ***</td>
</tr>
<tr>
<td valign="middle" align="left">Genotype(<italic>G</italic>)</td>
<td valign="middle" align="left">339</td>
<td valign="middle" align="left">14372.447</td>
<td valign="middle" align="left">42.397</td>
<td valign="middle" align="left">31.165</td>
<td valign="middle" align="left">&lt;0.0001 ***</td>
</tr>
<tr>
<td valign="middle" align="left">Environment(<italic>E</italic>)</td>
<td valign="middle" align="left">3</td>
<td valign="middle" align="left">5126.621</td>
<td valign="middle" align="left">1708.874</td>
<td valign="middle" align="left">1256.154</td>
<td valign="middle" align="left">&lt;0.0001 ***</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>G</italic> &#xd7; <italic>E</italic></td>
<td valign="middle" align="left">1017</td>
<td valign="middle" align="left">5845.622</td>
<td valign="middle" align="left">5.748</td>
<td valign="middle" align="left">4.225</td>
<td valign="middle" align="left">&lt;0.0001 ***</td>
</tr>
<tr>
<td valign="middle" align="left">Residuals</td>
<td valign="middle" align="left">3201</td>
<td valign="middle" align="left">4354.645</td>
<td valign="middle" align="left">1.360</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>DF, degrees of freedom; SS, sum of squares; MS, mean sum of squares; E, environment; Prob, probability; <italic>P</italic> value&lt; 0.0001, significant.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>The average values of the SPC ranged from 39.75 to 42.23% in the environments of CC22 and CC23, respectively; and the minimum and maximum values of SPC were 31.72% and 50.83% in the environments of CC22 and CC23, respectively. The CVs for the SPC varied from 4.58 to 5.59% in the environments of CC24 and CC22, respectively; and the CV of SPC in the CE was 4.36%. The skewness for the SPC ranged from -0.11 to 0.02 in the CC22 and CC23 environments, respectively; and the kurtosis of SPC varied from 0.02 to 0.50 in the environments of CC24 and CC23, respectively. Broad-sense heritability (<italic>H</italic>) for SPC was high, and was equal to 0.79 (<xref ref-type="supplementary-material" rid="SF10"><bold>Supplementary Table S2</bold></xref>). The results of ANOVA analysis showed highly significant (<italic>P&lt;</italic>0.0001) variances of <italic>G</italic>, <italic>E</italic> and <italic>G &#xd7; E</italic> interaction for the SPC (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>).</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Population structure and linkage disequilibrium analysis</title>
<p>Here, we detected 3,343,372 high-quality SNPs by applying the stringent measures of quality control (<xref ref-type="supplementary-material" rid="SF11"><bold>Supplementary Table S3</bold></xref>). The distribution of these SNPs was located across the whole genome of the soybean; the lowest and highest SNPs were present on Chr.11 (63,224) and Chr.15 (256,000), respectively, with an average number of 167,168.6 SNPs per chromosome (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2B</bold></xref>; <xref ref-type="supplementary-material" rid="SF11"><bold>Supplementary Table S3</bold></xref>). Substantial variation was observed for the marker density among the various soybean chromosomes; for example, the lowest marker density of 1,818.51 SNPs/Mb was observed on Chr.11, and the highest marker density of 4,946.25 SNPs/Mb was observed on Chr.15, and the mean value of the marker density was 3,522.37 SNPs/Mb (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2A</bold></xref>; <xref ref-type="supplementary-material" rid="SF11"><bold>Supplementary Table S3</bold></xref>). The kinship matrix showed no clear-cut clustering in the panel of soybean accessions (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2E</bold></xref>). Besides, no distinct structure was observed, and a continuous distribution of the soybean accessions has been shown by the analysis of population structure (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2D</bold></xref>; <xref ref-type="supplementary-material" rid="SF11"><bold>Supplementary Table S3</bold></xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Marker allocation, population structure analysis and LD decay plot in the 340 soybean accessions. <bold>(A)</bold> SNP density plot of 20 soybean chromosomes involving 3,343,372 SNPs across the GWAS panel. Horizontal axis shows the length of chromosomes in Mb, and vertical axis represents the chromosome number; and the various colors depict the chromosome density. <bold>(B)</bold> Distribution of 3,343,372 SNPs across the 20 different chromosomes of soybean. <bold>(C)</bold> LD decay plot generated from the 3,343,372 SNPs in the GWAS panel. Blue thick line corresponds to LD decay fitted with a smoothing spline regression model. The intersection of the horizontal and vertical dotted lines on the LD decay curve represents the LD half decay (<italic>r<sup>2</sup></italic>&#xa0;=&#xa0;0.34) and the genetic distance at half decay point is 71.7 kb. <bold>(D)</bold> PCA analysis displays the organization of the 340 accessions of soybean derived from different regions of northeast China. <bold>(E)</bold> Kinship plot displays the relationship among the panel of 340 soybean accessions.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767299-g002.tif">
<alt-text content-type="machine-generated">Figure composed of five panels labeled A to E. Panel A: Heatmap illustrating the number of SNPs within 1 megabase window sizes across 20 chromosomes, with color gradient representing SNP density from low (gray) to high (red). Panel B: Bar chart displaying SNP counts per chromosome, with each chromosome represented by a distinct color. Panel C: Line graph showing the decay of linkage disequilibrium (r-squared) as a function of distance, marking a specific point at 71.7 base pairs and r-squared value 0.34. Panel D: 3D principal component analysis scatter plot, color-coded by group, displaying genetic diversity among individuals. Panel E: Hierarchical clustering heatmap showing genetic relationships, with the dendrogram indicating clustering patterns.</alt-text>
</graphic></fig>
<p>We studied the features of LD across the panel of 340 diverse soybean accessions, and the outcomes are revealed in the graph (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2C</bold></xref>). The average value of <italic>r<sup>2</sup></italic> was 0.32, with LD decay started at 0.68; the half decay reached at 0.34. The intersection occurs between the LD decay curve and half decay at the 71.7 kb; and this distance decides the linkage at the genome-wide level. The genomic region of &#xb1; 71.7 kb across the stable significant SNPs was designated as the QTL interval.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>GWAS analysis of SOC and SPC</title>
<p>Here, we detected 105 and 59 significant SNPs linked with the SOC and SPC traits, respectively across the four individual environments (CC22, CC23, CC24 &amp; JT24) plus CE and seven GWAS models (<xref ref-type="fig" rid="f3"><bold>Figures&#xa0;3</bold></xref>, <xref ref-type="fig" rid="f4"><bold>4</bold></xref>; <xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>). The 105 significant SNPs of SOC were distributed across all the soybean chromosomes except Chr.07 and Chr.15; and the allocation of these SNPs in the various models and environments were presented in UpSet plot (<xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5A, B</bold></xref>). A maximum of 33 significant SNPs of SOC were present on Chr.08, and a minimum of one significant SNP was identified on Chr.16 and Chr. 20. The remaining 15 chromosomes possessed significant SNPs in the range of 2 to 15 (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>). By considering the detection of SOC related significant SNPs by various GWAS models, the one SNP viz., Chr08_9071263 was persistently identified by all the seven models viz., GLM, MLM, CMLM, MLMM, SUPER, FarmCPU and BLINK; the rest of the 104 SOC related significant SNPs were identified by one to five GWAS models (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>). Furthermore, the SNP Chr08_9071263 was persistently identified by three single environments plus CE. The SNPs viz., Chr08_9054741, Chr08_9056324 and Chr08_9071236 were persistently detected in two single environments plus CE; and Chr09_6929070, Chr10_44584365, Chr10_44584422 and Chr15_10147967 were detected by two single environments or one single environment plus CE. The rest of the 97 SOC related significant SNPs were identified in one single environment or CE (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>).</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Illustration reveals the GWAS signals of SOC across various GWAS models and environments. The different models include GLM, MLM, CMLM, MLMM, BLINK, SUPER and FarmCPU; and different single environments include CC22, CC23, CC24 &amp; JT24 plus CE. <bold>(A&#x2013;E)</bold> represents the Manhattan plots in various environments viz., <bold>(A)</bold> CC22, <bold>(B)</bold> CC23, <bold>(C)</bold> CC24, <bold>(D)</bold> JT24 and <bold>(E)</bold> CE. <bold>(F&#x2013;J)</bold> represents the quantile&#x2013;quantile (Q&#x2013;Q) plots in various environments viz., <bold>(F)</bold> CC22, <bold>(G)</bold> CC23, <bold>(H)</bold> CC24, <bold>(I)</bold> JT24 and <bold>(J)</bold> CE. Significant threshold level [-log<sub>10</sub><italic>P</italic>&gt; 6.52] is shown by the black horizontal dotted line. The number along the X-axis corresponds to different chromosomes. In the Manhattan plot and Q-Q plot different colors of dots correspond to various GWAS models.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767299-g003.tif">
<alt-text content-type="machine-generated">Ten-panel figure displaying Manhattan plots (A-E) and corresponding Q-Q plots (F-J) for genome-wide association studies using six statistical methods, distinguished by color. Manhattan plots show genomic position by chromosome on the x-axis and negative log P-values on the y-axis, with a horizontal significance threshold. Q-Q plots depict observed versus expected negative log P-values, comparing method distributions. Each method's results cluster visually, allowing evaluation of significance and deviation for each trait or statistical model tested.</alt-text>
</graphic></fig>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Illustration is revealing the GWAS signals of SPC across various GWAS models and environments. The different models include GLM, MLM, CMLM, MLMM, BLINK, SUPER and FarmCPU; and different single environments include CC22, CC23, CC24 &amp; JT24 plus CE. <bold>(A-E)</bold> represents the Manhattan plots in various environments viz., <bold>(A)</bold> CC22, <bold>(B)</bold> CC23, <bold>(C)</bold> CC24, <bold>(D)</bold> JT24 and <bold>(E)</bold> CE. <bold>(F&#x2013;J)</bold> represents the quantile&#x2013;quantile (Q&#x2013;Q) plots in various environments viz., <bold>(F)</bold> CC22, <bold>(G)</bold> CC23, <bold>(H)</bold> CC24, <bold>(I)</bold> JT24 and <bold>(J)</bold> CE. Significant threshold level [-log<sub>10</sub><italic>P</italic>&gt; 6.67] is shown by the black horizontal dotted line. The number along the X-axis corresponds to different chromosomes. In the Manhattan plot and Q-Q plot different colors of dots correspond to various GWAS models.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767299-g004.tif">
<alt-text content-type="machine-generated">Ten-panel scientific figure showing five Manhattan plots (A&#x2013;E) and five QQ plots (F&#x2013;J). Manhattan plots display &#x2013;log10(p) values of genetic associations across chromosomes one to twenty, with results from GLM, MLM, CMLM, MLMM, super, FarmCPU, and BLINK methods differentiated by color. QQ plots compare observed versus expected &#x2013;log10(p) for the same methods, illustrating deviation from the null hypothesis for each association test.</alt-text>
</graphic></fig>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>UpSet plots depicting intersection of significant SNPs of SOC and SPC across models and environments. The GWAS models include GLM, MLM, CMLM, MLMM, SUPER, FarmCPU and BLINK; and environments include CC22, CC23, CC24, JT24 &amp; CE. <bold>(A)</bold> UpSet plot demonstrating the intersection of significant SNPs of SOC across various environments. <bold>(B)</bold> UpSet plot demonstrating the intersection of significant SNPs of SOC across various GWAS models. <bold>(C)</bold> UpSet plot demonstrating the intersection of significant SNPs of SPC across various environments. <bold>(D)</bold> UpSet plot demonstrating the intersection of significant SNPs of SPC across various GWAS models.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767299-g005.tif">
<alt-text content-type="machine-generated">Figure containing four grouped bar and dot charts labeled A, B, C, and D, each showing the intersection of SNP numbers for various traits analyzed by different environments and models. Bar graphs on the left of each panel display SNP counts per environment or model, while vertical blue bars show unique and overlapping SNP counts. Panel A and B are labeled SOC, panels C and D are labeled SPC, indicating two traits. Black dots mark intersections, and values are annotated above bars for emphasis.</alt-text>
</graphic></fig>
<p>The 59 significant SNPs detected for the SPC were distributed across the 17 out of total 20 soybean chromosomes viz., Chr.01, Chr.02, Chr.03, Chr.05, Chr.06, Chr.07, Chr.08, Chr.09, Chr.10, Chr.12, Chr.13, Chr.14, Chr.15, Chr.16, Chr.17, Chr.18 and Chr.20; no significant SNPs for the SPC were detected on the Chr.04, Chr.11 and Chr.19 (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>). Distribution of these 59 SNPs across the different GWAS models and environments is presented in the UpSet plot (<xref ref-type="fig" rid="f5"><bold>Figures&#xa0;5C, D</bold></xref>). We detected a maximum of eight SNPs on the Chr.18, and a minimum of one significant SNP on the chromosomes viz., Chr.07, Chr.10 and Chr.14; and the remaining 14 chromosomes possess the significant SNPs from two to six (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>). The significant SNPs for the SPC were distributed across the different models as, the SNPs viz., Chr08_9054741 and Chr18_54408341 were detected by all the seven GWAS models, this is followed by SNP Chr18_54376853 that was detected by five models viz., GLM, MLMM, super, FarmCPU and BLINK; the remaining 56 SNPs were detected by one to three GWAS models (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>). Moreover, the SNPs viz., Chr18_54408341 was detected by two single environments (CC22 &amp; CC23) plus CE; and the SNPs viz., Chr01_11010539, Chr06_6762512 and Chr08_9054741 were detected by one single environment plus CE. The rest of the 55 SPC related SNPs were identified in one single environment or CE (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>).</p>
<p>However, among the total of 105 and 59 SNPs detected to be associated with SOC and SPC, respectively; only three significant SNPs viz., Chr08_9054741, Chr08_9071236 and Chr08_9071263 were associated with both SOC and SPC (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>). The effect of Chr08_9054741 was negative on both SOC (-1.34) and SPC (-2.04) traits, whereas the effect of Chr08_9071236 was positive on both SOC (1.35) and SPC (1.76); moreover, the effect of Chr08_9071263 was positive on SOC (1.32) as well as SPC (1.94). These results indicate that these three common SNPs govern the SOC and SPC traits in the same direction. The remaining SNPs were associated with either SOC or SPC (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>).</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Superior haplotypes for SOC and SPC</title>
<p>The significant SNPs present in the same chromosome that were associated with the same trait or related traits, and were fitting into the LD decay range of &#xb1; 71.7 kb formed the haplotype blocks. Besides, the SNPs identified through different GWAS models but fell within the physical interval of &#xb1; 71.7 kb were also used for haplotype block construction. In this regard, our findings revealed that two, three, two, two, three, three, twenty-six, three, eleven, two, two, two, five, two and two significant SNPs associated with the SOC or/and SPC were present on the chromosomes viz., Chr.01, Chr.06, Chr.06, Chr.08, Chr.08, Chr.08, Chr.08, Chr.09, Chr.10, Chr.12, Chr.15, Chr.15, Chr.18, Chr.18 and Chr.20, respectively and are fitting into the half LD decay distance; therefore, they constituted 15 haplotype blocks viz., Hap-1, Hap-6.1, Hap-6.2, Hap-8.1, Hap-8.2, Hap-8.3, Hap-8.4, Hap-9, Hap-10, Hap-12, Hap-15.1, Hap-15.2, Hap-18.1, Hap-18.2 and Hap-20, respectively (<xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6</bold></xref>, <xref ref-type="fig" rid="f7"><bold>7</bold></xref>; <xref ref-type="supplementary-material" rid="SF13"><bold>Supplementary Table S5</bold></xref>).</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Analysis of 14 haplotype blocks associated with the SOC across the 340 accessions of soybean. <bold>(A)</bold> Hap-1, <bold>(B)</bold> Hap-6.1, <bold>(C)</bold> Hap-6.2, <bold>(D)</bold> Hap-8.1, <bold>(E)</bold> Hap-8.2, <bold>(F)</bold> Hap-8.3, <bold>(G)</bold> Hap-8.4, <bold>(H)</bold> Hap-9, <bold>(I)</bold> Hap-10, <bold>(J)</bold> Hap-15.1, <bold>(K)</bold> Hap-15.2, <bold>(L)</bold> Hap-18.2, <bold>(M)</bold> Hap-18.2, and <bold>(N)</bold> Hap-20. Haplotype allele number ranges from two to four across the 14 blocks in the soybean germplasm governing the SOC from the minimum to maximum levels through intermediate phenotypes. The different letters at the top of density curve correspond to differences at the significant level, whereas the same letters correspond to differences at the non-significant levels.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767299-g006.tif">
<alt-text content-type="machine-generated">Grouped violin plots labeled panels A to N compare SOC values across different haplotypes, with each panel showing distinct color-coded groups, boxplots inside violins, dot plots for data points, and statistical significance indicated by superscript letters above each group.</alt-text>
</graphic></fig>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Analysis of 11 haplotype blocks associated with the SPC across the 340 accessions of soybean. <bold>(A)</bold> Hap-1, <bold>(B)</bold> Hap-6.1, <bold>(C)</bold> Hap-6.2, <bold>(D)</bold> Hap-8.1, <bold>(E)</bold> Hap-8.2, <bold>(F)</bold> Hap-8.3, <bold>(G)</bold> Hap-8.4, <bold>(H)</bold> Hap-12, <bold>(I)</bold> Hap-15.2, <bold>(J)</bold> Hap-18.1, and <bold>(K)</bold> Hap-20. Haplotype allele number ranges from two to four across the 11 blocks in the soybean germplasm governing the SPC from the minimum to maximum levels through intermediate phenotypes. The different letters at the top of density curve correspond to differences at the significant level, whereas the same letters correspond to differences at the non-significant levels.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767299-g007.tif">
<alt-text content-type="machine-generated">Violin plots in panels A to K compare SPC values across different haplotypes, labeled on the x-axes. Colors differentiate haplotypes, and lowercase letters above violins indicate statistically significant differences between groups.</alt-text>
</graphic></fig>
<p>The number of haplotype alleles of these 15 haplotype blocks varied from two (Hap-1) to four (Hap-6.1) (<xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6</bold></xref>, <xref ref-type="fig" rid="f7"><bold>7</bold></xref>; <xref ref-type="supplementary-material" rid="SF13"><bold>Supplementary Table S5</bold></xref>). Out of 15 haplotype blocks, the haplotype alleles of 14 blocks viz., Hap-1, Hap-6.1, Hap-6.2, Hap-8.1, Hap-8.2, Hap-8.3, Hap-8.4, Hap-9, Hap-10, Hap-15.1, Hap-15.2, Hap-18.1, Hap-18.2 and Hap-20 revealed differences at the significant level in the governing of SOC that varied from 16.68-21.15% (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>; <xref ref-type="supplementary-material" rid="SF13"><bold>Supplementary Table S5</bold></xref>). In contrast, the haplotype alleles of 11 out of total 16 haplotype blocks viz., Hap-1, Hap-6.1, Hap-6.2, Hap-8.1, Hap-8.2, Hap-8.3, Hap-8.4, Hap-12, Hap-15.2, Hap-18.1, and Hap-20 revealed differences at the significant levels in the governing of SPC that varied from 38.63-42.69%; whereas the haplotype alleles of the remaining four haplotype blocks viz., Hap-9, Hap-10, Hap-15.2, and Hap-18.1 showed differences at the non-significant levels in the governing of SPC (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref>; <xref ref-type="supplementary-material" rid="SF13"><bold>Supplementary Table S5</bold></xref>).</p>
<p>In conclusion, the haplotype alleles of 14 and 11 haplotype blocks associated with SOC and SPC, respectively, regulate the different phenotypes of these two traits ranging from low-intermediate-high.</p>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Stable QTL identification of SOC and SPC</title>
<p>Multiple significant SNPs were detected in different environments and models across the LD decay (&#xb1; 71.7 kb) distance of 15 haplotype blocks viz., Hap-1, Hap-6.1, Hap-6.2, Hap-8.1, Hap-8.2, Hap-8.3, Hap-8.4, Hap-9, Hap-10, Hap-12, Hap-15.1, Hap-15.2, Hap-18.1, Hap-18.2 and Hap-20, hence they also represented the 15 stable QTLs named as <italic>qSOC1</italic>, <italic>qSOC_SPC6.1</italic>, <italic>qSOC_SPC6.2</italic>, <italic>qSOC8.1</italic>, <italic>qSOC8.2</italic>, <italic>qSOC8.3</italic>, <italic>qSOC_SPC8</italic>, <italic>qSOC9</italic>, <italic>qSOC10</italic>, <italic>qSPC12</italic>, <italic>qSOC_SPC15.1</italic>, <italic>qSOC_SPC15.2</italic>, <italic>qSPC18</italic>, <italic>qSOC18</italic> and <italic>qSPC20</italic> (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>; <xref ref-type="supplementary-material" rid="SF2"><bold>Supplementary Figure&#xa0;2</bold></xref>). Besides, the genomic intervals of &#xb1; half LD-decay distance across the SNPs detected by various models and environments such as Chr01_11010539 and Chr15_10147967, which were present on Chr.01 and Chr.15, respectively, were defined as stable QTLs. They represent two QTLs referred to as <italic>qSPC1</italic> and <italic>qSOC15</italic>, respectively (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>). Hence, together we identified a total of 17 QTLs; among these QTLs, the eight viz., <italic>qSOC1</italic>, <italic>qSOC8.1</italic>, <italic>qSOC8.2</italic>, <italic>qSOC8.3</italic>, <italic>qSOC9</italic>, <italic>qSOC10</italic>, <italic>qSOC15</italic> and <italic>qSOC18</italic> were associated with the SOC trait only, whereas the four QTLs viz., <italic>qSPC1</italic>, <italic>qSPC12</italic>, <italic>qSPC18</italic>, and <italic>qSPC20</italic> were associated with only SPC trait. However, the five QTLs viz., <italic>qSOC_SPC6.1</italic>, <italic>qSOC_SPC6.2</italic>, <italic>qSOC_SPC8</italic>, <italic>qSOC_SPC15.1</italic> and <italic>qSOC_SPC15.2</italic> were linked with both SOC and SPC traits (<xref ref-type="supplementary-material" rid="SF12"><bold>Supplementary Table S4</bold></xref>; <xref ref-type="supplementary-material" rid="SF2"><bold>Supplementary Figure&#xa0;2</bold></xref>). The above genomic loci/QTLs were identified through various environments and GWAS models, that in turn indicates the persistency and stability of these genomic loci in the governing of SOC or/and SPC.</p>
<p>To quantify the genetic basis underlying the observed phenotypic correlation between SOC and SPC, we performed a linear regression analysis to evaluate the phenotypic variance explained (PVE) by the identified stable QTLs based on the phenotypic data from the CE (<xref ref-type="supplementary-material" rid="SF14"><bold>Supplementary Table S6</bold></xref>). The five major pleiotropic QTL regions (<italic>qSOC_SPC6.1</italic>, <italic>qSOC_SPC6.2</italic>, <italic>qSOC_SPC8</italic>, <italic>qSOC_SPC15.1</italic> and <italic>qSOC_SPC15.2</italic>) were found to collectively account for 26.19% of the total variance for SOC and 22.26% for SPC. This indicated that around a quarter portion of the variation in both traits was governed by shared genomic &#x201c;hotspots&#x201d;. Furthermore, the other six stable QTLs of which the haplotype blocks exhibited significant individual effects on both traits (<italic>qSOC1</italic>, <italic>qSOC8.1</italic>, <italic>qSOC8.2</italic>, <italic>qSOC8.3</italic>, <italic>qSPC18</italic> and <italic>qSPC20</italic>) explained a total PVE of 22.17% for SOC and 29.49% for SPC. These 11 QTLs explained 48.36% of the phenotypic variance of SOC and 51.74% of SPC, respectively. The remaining phenotypic residuals (~31%) likely reflected the influence of numerous sub-threshold minor-effect loci and environmental factors. These results provide a genetic explanation for the significant correlation between SOC and SPC observed in our germplasm.</p>
</sec>
<sec id="s3_6">
<label>3.6</label>
<title>Candidate gene identification for SOC and SPC</title>
<p>Here, we identified 353 model genes across the genomic intervals of 17 QTLs viz., <italic>qSPC1</italic>, <italic>qSOC1</italic>, <italic>qSOC_SPC6.1</italic>, <italic>qSOC_SPC6.2</italic>, <italic>qSOC8.1</italic>, <italic>qSOC8.2</italic>, <italic>qSOC8.3</italic>, <italic>qSOC_SPC8</italic>, <italic>qSOC9</italic>, <italic>qSOC10</italic>, <italic>qSPC12</italic>, <italic>qSOC15, qSOC_SPC15.1</italic>, <italic>qSOC_SPC15.2</italic>, <italic>qSPC18</italic>, <italic>qSOC18</italic> and <italic>qSPC20</italic>, that include 5, 15, 28, 24, 21, 19, 25, 41, 9, 30, 37, 13, 11, 22, 25, 14 and 14 genes, respectively. The gene ontology (GO) analysis was carried out by utilizing the online available web-based toolkit viz., agriGO V2.0; and this analysis showed the enrichment of various terms among the major categories viz., molecular function, biological process and cellular component within the 17 genomic loci linked with SOC and SPC traits (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8A</bold></xref>). The terms with the highest enrichment across the 17 QTLs are shown in <xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8A</bold></xref>. The gene expression levels of model genes residing in the physical intervals of 17 QTLs across the various tissues/organs and seed development stages of soybean are presented in the form of heatmap (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8B</bold></xref>). By using the <italic>in-silico</italic> analysis viz., function annotations, transcriptomic analysis and literature survey, we sorted out 121 genes across the genomic interval of 17 QTLs as possible candidates governing SOC and SPC traits in soybean (<xref ref-type="supplementary-material" rid="SF15"><bold>Supplementary Table S7</bold></xref>). These include 3, 5, 11, 9, 11, 7, 7, 14, 3, 6, 5, 6, 4, 4, 8, 10, and 8 candidate genes across the physical interval of 17 QTLs viz., <italic>qSPC1</italic>, <italic>qSOC1</italic>, <italic>qSOC_SPC6.1</italic>, <italic>qSOC_SPC6.2</italic>, <italic>qSOC8.1</italic>, <italic>qSOC8.2</italic>, <italic>qSOC8.3</italic>, <italic>qSOC_SPC8</italic>, <italic>qSOC9</italic>, <italic>qSOC10</italic>, <italic>qSPC12</italic>, <italic>qSOC15, qSOC_SPC15.1</italic>, <italic>qSOC_SPC15.2</italic>, <italic>qSPC18</italic>, <italic>qSOC18</italic> and <italic>qSPC20</italic>, respectively (<xref ref-type="supplementary-material" rid="SF15"><bold>Supplementary Table S7</bold></xref>). Gene function annotations such as amino acid biosynthesis, protein biosynthesis, amino acid and protein transport, fatty acid biosynthesis, lipid biosynthesis, fatty acid and lipid transport as well as processes related to the protein and lipid biosynthesis and their accumulation, and seed development (<xref ref-type="supplementary-material" rid="SF15"><bold>Supplementary Table S7</bold></xref>), and genes showing higher expression (as showed by RNA-seq dataset) during the seed development stages were the main criteria to select the candidate genes (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8B</bold></xref>). These 121 genes were regarded as putative candidates for regulating the SOC and SPC in soybean.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p><italic>In-silico</italic> analysis of model genes occurring across the genomic interval of 17 QTLs. <bold>(A)</bold> This figure corresponds to gene ontology (GO) enrichment analysis of model genes for the terms belonging to three major categories viz., cellular component, biological process and metabolic function; and <bold>(B)</bold> This figure displays the expression pattern of the model genes present across the physical interval of 17 QTLs using the RNA-seq data; and the expression results are presented for the different development stages and tissues such as leaf, flower, pod and seed of soybean plant.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767299-g008.tif">
<alt-text content-type="machine-generated">Panel A displays a grouped bar chart categorizing gene numbers by Gene Ontology terms, with bars colored by Biological Process, Cellular Component, and Molecular Function. Panel B presents a heatmap showing gene expression levels across various seed tissues, seed tissue types, and developmental stages, annotated with color-coded legends identifying expression levels, tissue types, and developmental stages.</alt-text>
</graphic></fig>
<p>To further screen out the genes regulating the SOC and SPC traits, we performed the sequence variation analysis, variant annotation analysis and haplotype analysis. Out of these 121 genes, only 104 genes showed sequence variations (<xref ref-type="supplementary-material" rid="SF16"><bold>Supplementary Table S8</bold></xref>). Among these 104 genes, the haplotype alleles of 80 genes revealed differences at significant levels in governing the SOC or/and SPC (<xref ref-type="supplementary-material" rid="SF17"><bold>Supplementary Tables S9</bold></xref>). In these 80 genes, the haplotype allele number varied from a minimum of two to the maximum of 8, regulating the SOC and SPC in the ranges of 15.98-21.23% and 37.69%-43.30%, respectively. Among these 80 genes, the haplotype alleles of 11 genes only showed differences at the significant levels in governing the SOC, whereas the haplotype alleles of 6 genes only showed differences at the significant levels in governing the SPC. However, in the remaining 63 genes (out of the total 80) the haplotype alleles revealed differences at the significant levels in governing of both SOC and SPC. The haplotype alleles of these 80 genes regulate the different phenotypes of SOC or SPC or both traits ranging from minimum to maximum levels through intermediate phenotypes. The variant annotation analysis showed that 45 of the 80 genes showed non-synonymous mutations, whereas the remaining 35 genes showed synonymous mutations (<xref ref-type="supplementary-material" rid="SF16"><bold>Supplementary Table S8</bold></xref>). Hence, these 80 genes were prioritized as candidate genes governing the SOC and SPC traits in soybean (<xref ref-type="supplementary-material" rid="SF17"><bold>Supplementary Table S9</bold></xref>).</p>
<p>Furthermore, we performed haplotype selection analysis of the soybean accessions adapted to different latitudes i.e., from low-latitude to high-latitude for these 80 genes using the public data from the SoyMD (<ext-link ext-link-type="uri" xlink:href="https://yanglab.hzau.edu.cn/SoyMD/#/">https://yanglab.hzau.edu.cn/SoyMD/#/</ext-link>; <xref ref-type="supplementary-material" rid="SF3"><bold>Supplementary Figures&#xa0;3</bold></xref>-<xref ref-type="supplementary-material" rid="SF8"><bold>8</bold></xref>). Our haplotype results showed that 12 genes viz., <italic>Glyma.01G175500</italic>, <italic>Glyma.01G176000</italic>, <italic>Glyma.08G101100</italic>, <italic>Glyma.08G101900</italic>, <italic>Glyma.08G103100</italic>, <italic>Glyma.08G111700</italic>, <italic>Glyma.08G111800</italic>, <italic>Glyma.08G117000</italic>, <italic>Glyma.15G232200</italic>, <italic>Glyma.18G258000</italic>, <italic>Glyma.18G258100</italic>, <italic>Glyma.18G259100</italic> underwent divergent selection for the specific haplotypes across the soybean population adapted to different latitudes (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>; <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref>). For example, in <italic>Glyma.01G175500</italic>, the Hap_001 was predominantly selected in soybeans in Northeast China, whereas Hap_002 was predominantly selected in soybeans from southern parts of China. In the same way, the divergent specific haplotypes have been selected for the low- and high-latitude soybeans in the remaining 11 genes (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>). Moreover, the <italic>F<sub>ST</sub></italic>, <italic>&#x3c0;</italic> and Tajima&#x2019;s <italic>D</italic> analysis also revealed the differential/divergent selection of these 12 genes among the soybean populations adapted to different latitudes (<xref ref-type="supplementary-material" rid="SF3"><bold>Supplementary Figures&#xa0;3</bold></xref>-<xref ref-type="supplementary-material" rid="SF8"><bold>8</bold></xref>). Hence, these 12 genes are the most potential candidates regulating the difference in the SOC and SPC traits in the soybeans adapted to the environment of Northeast China.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Description of the 12 divergently selected genes across the different latitudes.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Gene</th>
<th valign="middle" align="left">Orthologous gene in Arabidposis</th>
<th valign="middle" align="left">Function annotation</th>
<th valign="middle" align="left">Haplotypes selected in high-latitudes</th>
<th valign="middle" align="left">Haplotype selected in low-latitudes</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left"><italic>Glyma.01G175500</italic></td>
<td valign="middle" align="left"><italic>AT3G50660.1 (CYP90B1);</italic> Cytochrome P450 superfamily protein</td>
<td valign="middle" align="left">Sterol biosynthetic process; unidimensional cell growth</td>
<td valign="middle" align="left">Hap-001</td>
<td valign="middle" align="left">Hap-002</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.01G176000</italic></td>
<td valign="middle" align="left"><italic>AT4G36630.1 (EMB2754);</italic> Vacuolar sorting protein 39</td>
<td valign="middle" align="left">Embryo development ending in seed dormancy; intracellular protein transport; protein N-linked glycosylation; protein glycosylation; protein targeting to vacuole</td>
<td valign="middle" align="left">Hap-001</td>
<td valign="middle" align="left">Hap-002</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.08G101100</italic></td>
<td valign="middle" align="left"><italic>AT1G67680.1;</italic> SRP72 RNA-binding domain</td>
<td valign="middle" align="left">SRP-dependent cotranslational protein targeting to membrane</td>
<td valign="middle" align="left">Hap-001, Hap-003</td>
<td valign="middle" align="left">Hap-002</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.08G101900</italic></td>
<td valign="middle" align="left"><italic>AT5G40780.1;</italic> lysine histidine transporter 1</td>
<td valign="middle" align="left">ER to Golgi vesicle-mediated transport; N-terminal protein myristoylation; amino acid import; amino acid transport; ammonium transport; anion transport; basic amino acid transport.</td>
<td valign="middle" align="left">Hap-001</td>
<td valign="middle" align="left">Hap-002</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.08G103100</italic></td>
<td valign="middle" align="left"><italic>AT1G24330.1;</italic> ARM repeat superfamily protein</td>
<td valign="middle" align="left">Protein ubiquitination</td>
<td valign="middle" align="left">Hap-001, Hap-002</td>
<td valign="middle" align="left">Hap-003, Hap-004</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.08G111700</italic></td>
<td valign="middle" align="left"><italic>AT5G55160.1 (SUM2/SUMO 2);</italic> small ubiquitin-like modifier 2</td>
<td valign="middle" align="left">Gluconeogenesis; methionine biosynthetic process; proteasomal protein catabolic process; protein sumoylation;</td>
<td valign="middle" align="left">Hap-002</td>
<td valign="middle" align="left">Hap-001</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.08G111800</italic></td>
<td valign="middle" align="left"><italic>AT5G55160.1 (SUM2/SUMO 2);</italic> small ubiquitin-like modifier 2</td>
<td valign="middle" align="left">Gluconeogenesis; methionine biosynthetic process; proteasomal protein catabolic process; protein sumoylation; response to heat</td>
<td valign="middle" align="left">Hap-002</td>
<td valign="middle" align="left">Hap-001, Hap-003</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.08G117000</italic></td>
<td valign="middle" align="left"><italic>AT5G45800.1 (MEE62);</italic> Leucine-rich repeat protein kinase family protein</td>
<td valign="middle" align="left">Embryo development ending in seed dormancy; protein phosphorylation; transmembrane receptor protein tyrosine kinase signaling pathway</td>
<td valign="middle" align="left">Hap-001</td>
<td valign="middle" align="left">Hap-002, Hap-003</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.15G232200</italic></td>
<td valign="middle" align="left"><italic>AT3G56710.1 (SIB1);</italic> sigma factor binding protein 1</td>
<td valign="middle" align="left">MAPK cascade; cellular response to nitrogen starvation; defense response, incompatible interaction.</td>
<td valign="middle" align="left">Hap-002</td>
<td valign="middle" align="left">Hap-001</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.18G258000</italic></td>
<td valign="middle" align="left"><italic>AT3G29590.1 (AT5MAT);</italic> HXXXD-type acyl-transferase family protein</td>
<td valign="middle" align="left">anthocyanin-containing compound biosynthetic process; response to UV-B; response to sucrose stimulus</td>
<td valign="middle" align="left">Hap-001, Hap-003</td>
<td valign="middle" align="left">Hap-002</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.18G258100</italic></td>
<td valign="middle" align="left"><italic>AT3G49190.1;</italic> O-acyltransferase (WSD1-like) family protein</td>
<td valign="middle" align="left">diacylglycerol O-acyltransferase activity</td>
<td valign="middle" align="left">Hap-001</td>
<td valign="middle" align="left">Hap-003, Hap-005</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>Glyma.18G259100</italic></td>
<td valign="middle" align="left"><italic>AT3G28910.1 (ATMYB30, MYB3);</italic> myb domain protein 30</td>
<td valign="middle" align="left">response to auxin stimulus; very long-chain fatty acid biosynthetic process</td>
<td valign="middle" align="left">Hap-001</td>
<td valign="middle" align="left">Hap-002, Hap-005</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>Distribution of different haplotypes of <italic>Glyma.01G175500</italic> across soybeans adapted to different regions. <bold>(A)</bold> Hap_001 was selected preferentially for the soybean adapted to low-latitudes, and Hap_002 was selected preferentially for the high-latitude adapted soybeans. <bold>(B)</bold><italic>F<sub>ST</sub></italic>, <italic>&#x3c0;</italic> and Tajima&#x2019;s <italic>D</italic> analysis revealing differential/divergent selection of <italic>Glyma.01G175500</italic> among the soybean populations adapted to different latitudes. The soybean production regions in China are divided into China-I, China-II, China-III, China-IV, China-V and China-VI following <xref ref-type="bibr" rid="B45">Liu et&#xa0;al. (2023)</xref>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1767299-g009.tif">
<alt-text content-type="machine-generated">Map of China with regions labeled China-I through China-VI, overlaid with pie charts showing proportions of different haplotypes by color. Legend identifies haplotypes Hap_001 to Hap_008 and Others. Below, panel B displays three line graphs with comparative genetic measures (Fst, &#x3c0;, and Tajima&#x2019;s D) along the x-axis position for each labeled region, color-coded to match the map.</alt-text>
</graphic></fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>The SOC and SPC are the two crucial traits governing the quality and yield in soybean. Development of soybean cultivars with high SOC and SPC is the central objective of soybean researchers. However, it has been documented that soybeans in Northeast China have high SOC but low SPC compared to low-latitude soybeans (<xref ref-type="bibr" rid="B68">Rotundo et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B21">Guo et&#xa0;al., 2022</xref>). Little is known about the genetic mechanism regulating these differences in SOC and SPC traits in soybeans of Northeast China. Hence, there is a need to explore the genetic mechanism of these differences across the soybeans adapted to different latitudes. The amount of SOC and SPC in the global soybean germplasm varies from 8.10-27.10% and 34.1&#x2013;56.8%, respectively (<xref ref-type="bibr" rid="B82">Wang et&#xa0;al., 2025</xref>). In agreement, our study also showed that SOC and SPC varied from 13.59-24.67% and 31.72-50.83%, respectively in the Northeast China adapted soybean germplasm. Hence, a greater emphasis is needed to be put on the characterization of soybean germplasm for the SOC and SPC traits. The approaches of classical breeding have been earlier used to enhance the SOC and SPC in soybean; however, it has been documented that these breeding approaches have developed soybean cultivars with high SOC but at the cost of reduced SPC and vice versa (<xref ref-type="bibr" rid="B30">Karikari et&#xa0;al., 2019</xref>). In agreement, our study also reported a significant negative correlation between SOC and SPC (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1C</bold></xref>). The significant negative correlation between SOC and SPC has hindered the simultaneous improvement of these two traits in the same cultivar. Furthermore, the polygenic inheritance and environmental sensitiveness of the SOC and SPC traits make the conventional breeding unable to meet the demands (<xref ref-type="bibr" rid="B16">Duan et&#xa0;al., 2023</xref>). In this context, molecular breeding has promised to develop soybean cultivars with both high SOC and SPC especially by using the independent or non-correlated QTLs/genes (<xref ref-type="bibr" rid="B63">Patil et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B55">Moore Ronald et&#xa0;al., 2025</xref>). Hence, identifying the independent MTAs/QTLs/genes for these two traits, and their subsequent deployment in the breeding programs of soybean will break the negative correlation between SOC and SPC; thereby producing the soybean cultivars with both high SOC and SPC which is the long-term goal of soybean breeders. Hence, approaches of molecular breeding have increased ability and precision to develop improved cultivars in soybean (<xref ref-type="bibr" rid="B17">Duan et&#xa0;al., 2025</xref>). Here, we utilized combined strategy of GWAS, haplotype analysis, QTL analysis, and candidate gene analysis to elucidate the comprehensive genetic basis of SOC and SPC traits in soybeans in Northeast China.</p>
<sec id="s4_1">
<label>4.1</label>
<title>Phenotypic variability of the GWAS population</title>
<p>Here, a set of 340 diverse accessions of soybean was assessed for SOC and SPC traits at two locations viz., Changchun and Jiutai research farms, corresponding to the entire of four environments viz., CC22, CC23, CC24 and JT24 plus CE. The effects of <italic>G</italic>, <italic>E</italic> and <italic>G</italic> &#xd7; <italic>E</italic> interactions on the SOC and SPC traits were highly significant, which is in accordance with the findings documented by earlier authors (<xref ref-type="bibr" rid="B39">Li et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B26">Jin et&#xa0;al., 2023</xref>). These results in turn indicated the great potential of this soybean germplasm for the improvement of these traits; besides, the differences in the environmental variables among various environments have resulted in the different trait values of the SOC and SPC in the same set of soybean accessions. The higher value of <italic>H</italic> for the SOC and SPC traits indicated the same accessions of GWAS panel will perform alike if the same environmental conditions were provided. In agreement, many previous studies have reported similar outcomes for the SOC and SPC traits in soybean (<xref ref-type="bibr" rid="B39">Li et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B14">Diers et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B31">Kim et&#xa0;al., 2023</xref>). Moreover, highly significant <italic>G</italic>, <italic>E</italic> and <italic>G &#xd7; E</italic> interactions shown by SOC and SPC revealed their complex pattern of inheritance; and similar outcomes are reported by earlier researchers (<xref ref-type="bibr" rid="B26">Jin et&#xa0;al., 2023</xref>).</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Dissecting the genetic basis of SOC and SPC traits using the GWAS approach</title>
<p>In recent years, GWAS has been routinely used in plant research for the elucidation of genetic basis of different traits; and the special thanks go to the progress done in genome sequencing and high-throughput genotyping (<xref ref-type="bibr" rid="B2">Alqudah et&#xa0;al., 2020</xref>). In soybean, GWAS is utilized to explore the genetic elements of multiple traits including the SOC and SPC (<xref ref-type="bibr" rid="B34">Lee et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B39">Li et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B26">Jin et&#xa0;al., 2023</xref>). Hence, the current study used the advanced SNP genotyping in the GWAS approach to unravel the genomic loci and genes for SOC and SPC traits in soybean. Here, we detected the significant association of 105 and 59 SNPs with the SOC and SPC, respectively across the multiple environments (CC22, CC23, CC24 &amp; JT24) plus CE and seven GWAS models. These 105 and 59 significant SNPs of SOC and SPC were located on the 18 and 17 chromosomes of soybean, respectively, indicating multigenic inheritance of both traits, i.e. regulated by multiple genes. In accordance with our findings, the previous research studies have also documented the similar results of SOC and SPC traits in soybean (<xref ref-type="bibr" rid="B26">Jin et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B15">Doszhanova et&#xa0;al., 2024</xref>). Among the 105 and 59 SNPs detected significantly associated with SOC and SPC traits, respectively; only three common significant SNPs were linked with both SOC and SPC viz., Chr08_9054741, Chr08_9071236 and Chr08_9071263, while the remaining significant SNPs were either associated with the SOC or SPC. The three common SNPs associated with both SOC and SPC traits indicated their pleiotropic effect on the two traits, that may be because these SNPs were associated with genes encoding the enzyme involved in the common metabolic pathways (<xref ref-type="bibr" rid="B19">Gao et&#xa0;al., 2024</xref>; <xref ref-type="bibr" rid="B76">Van et&#xa0;al., 2025</xref>).</p>
<p>Furthermore, our outcomes revealed substantial variation in the identification of significant SNPs by seven different models for both traits. For instance, the Chr08_9071263 linked with SOC was detected by all seven models; in comparison, only one GWAS model detected the 30 significant SNPs. Similarly, the significant SNPs viz., Chr08_9054741 and Chr18_54408341 of SPC were detected by all seven GWAS models, whereas 27 SNPs of SPC were detected by a single GWAS model. Similar results have been reported by the earlier studies for various crop plants including soybean (<xref ref-type="bibr" rid="B35">Leventhal et&#xa0;al., 2025</xref>), maize (<xref ref-type="bibr" rid="B28">Kaler et&#xa0;al., 2020</xref>) and wheat (<xref ref-type="bibr" rid="B51">Merrick et&#xa0;al., 2022</xref>). The reason to describe this phenomenon is because the various models of GWAS are built on divergent hypotheses involving different distribution characteristics of QTL effects; hence, this leads to the difference in SNP detection among various GWAS models (<xref ref-type="bibr" rid="B59">Odell et&#xa0;al., 2022</xref>).</p>
<p>The moderate negative phenotypic correlation between SOC and SPC might be explained at the genetic level because some of the SNPs, QTLs and haplotype blocks affecting both traits simultaneously. Besides, the effects of environment as well as <italic>G</italic> &#xd7; <italic>E</italic> were highly significant in the GWAS population that might have further resulted in the negative correlation. The correlation between SOC and SPC was underpinned by a substantial shared genetic basis, as evidenced by the collective PVE of approximately 26% and 22% by the major pleiotropic QTLs, respectively (<xref ref-type="supplementary-material" rid="SF14"><bold>Supplementary Table S6</bold></xref>). Considering the other six stable QTLs of which the haplotype blocks exhibited significant individual effects on both traits, the 11 detected QTLs explained 56.23% of the heritability of SOC and 65.50% of SPC, respectively. Our regression analysis showed that the detected stable QTLs have already explained more than half of the genetic commonality. This implies that the observed phenotypic linkage is not merely a localized phenomenon but the aggregate result of multiple stable genetic regions.</p>
<p>Besides, substantial variation has been observed for the SNPs detected for both traits across the different environments. In some genomic regions, a locus may surpass the significance threshold for one trait/environment while having a significance level below the threshold for the other one. These suggestive signals may show consistent peak patterns across both traits/environments, supporting shared genetic control, but might be masked by statistical corrections and <italic>G</italic> &#xd7; <italic>E</italic> interactions. These outcomes revealed that SOC and SPC traits are substantially influenced by the environment, hence supporting the highly significant <italic>G</italic> &#xd7; <italic>E</italic> reported in this study.</p>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>Superior haplotypes identified for optimizing the SOC and SPC in soybean</title>
<p>In the GWAS analysis, soybean researchers have mostly used biallelic SNP markers; and these biallelic markers are not able to detect the multiple alleles present across the diverse GWAS panel that might represent the superior and rare alleles, hence making this valuable genetic diversity unavailable for the crop improvement (<xref ref-type="bibr" rid="B23">He and Gai, 2023</xref>). Therefore, there is an important need for multiallelic markers in the GWAS analysis to trap these superior/rare alleles as well as non-linear variation across the diverse natural crop germplasm. In this context, multiallelic markers of haplotypes have promised to fix these challenges of biallelic SNP markers in the GWAS (<xref ref-type="bibr" rid="B5">Bhat et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B77">Voorrips and Tumino, 2022</xref>). Hence, these markers will make the considerable genetic diversity accessible for crop improvement (<xref ref-type="bibr" rid="B77">Voorrips and Tumino, 2022</xref>). In the last few years, some studies have identified the superior haplotypes for various traits in soybean such as traits related to yield (<xref ref-type="bibr" rid="B69">Shao et&#xa0;al., 2022</xref>), plant height (<xref ref-type="bibr" rid="B65">Qin et&#xa0;al., 2023</xref>) and salinity tolerance (<xref ref-type="bibr" rid="B62">Patil et&#xa0;al., 2016</xref>). Besides, superior haplotypes are also detected in other crop species such as in pigeonpea for water deficit tolerance (<xref ref-type="bibr" rid="B70">Sinha et&#xa0;al., 2020</xref>) and in rice for quality traits (<xref ref-type="bibr" rid="B1">Abbai et&#xa0;al., 2019</xref>). There are multiple mechanisms including selection, recombination and mutation that govern the haplotype variation across the diverse crop germplasm (<xref ref-type="bibr" rid="B25">Hellsten et&#xa0;al., 2013</xref>). Hence, identifying and utilizing the haplotypes in molecular breeding has a substantial impact in crop improvement (<xref ref-type="bibr" rid="B70">Sinha et&#xa0;al., 2020</xref>). Here, we identified a total of 15 haplotype blocks, and the haplotype alleles of 14 out of total 15 haplotype blocks showed differences at the significant levels in the governing of SOC, whereas among the 15 haplotype blocks, the haplotype alleles of 11 blocks revealed differences at the significant levels in the governing of SPC. The haplotype alleles of these 15 blocks vary from two to four regulating the SOC or SPC from the low-intermediate-high levels. Among the 15 haplotype blocks, the haplotype alleles of Hap-1, Hap-8.2, Hap-8.3, Hap-8.4, showed positive correlation in the regulation of SOC and SPC; whereas the haplotype alleles of Hap-6.2, Hap-15.2 and Hap-20 showed negative correlation in the regulation of the SOC and SPC traits. However, the haplotype alleles of Hap-9, Hap-10, Hap-15.1, Hap-18.2 showed non-significant differences on the regulation of SPC, but revealed differences at the significant level in the governing of SOC; whereas the haplotype alleles of Hap-12 revealed differences at the significant level in the governing of SPC but revealed differences at the non-significant level in the governing of SOC. These findings suggest the SOC and SPC traits of soybean possess complicated genetic structure, where some genetic loci have positive effects on both SOC and SPC traits, and some genetic loci showed negative correlations in the regulation of SOC and SPC; and some loci have independent effects on either SOC or SPC. Our study showed that alleles of each haplotype block regulate the varied phenotypes of SOC and SPC, thus delivering an opportunity to optimize the desired quantity of SOC and SPC in the soybean cultivar. These haplotypes can be used to produce cultivars of soybean with optimized as well as improved SOC and SPC, hence will substantially impact the quality and yield of soybeans.</p>
</sec>
<sec id="s4_4">
<label>4.4</label>
<title>Stable QTLs detected for SOC and SPC traits</title>
<p>By considering the genomic regions (&#xb1; half LD-decay distance) flanking the two significant SNPs detected through various models and environments as well as the LD decay distance across the 15 identified haplotype blocks, we delineated a total of 17 stable QTLs associated with SOC or SPC or both traits. Among these 17 QTLs, 11 of them fell within the genomic interval of previously reported QTLs, hence not being considered as novel QTLs (<xref ref-type="supplementary-material" rid="SF2"><bold>Supplementary Figure&#xa0;2</bold></xref>). For example, <xref ref-type="bibr" rid="B94">Zhang et&#xa0;al. (2025)</xref> identified the significant SNP associated with SPC on Chr.06, and that SNP fell within the genomic interval of <italic>qSOC_SPC6.1</italic> (5133255&#x2013;5365962 bp). The <italic>qSOC_SPC6.2</italic> present on Chr.06 was present in the genomic regions of earlier reported QTLs viz., cqSeed protein-015 (5449370&#x2013;7326665 bp) and cqSeed oil-016 (5504147&#x2013;8260733 bp) (<xref ref-type="bibr" rid="B61">Pathan et&#xa0;al., 2013</xref>). Hence, the <italic>qSOC_SPC6.2</italic> might belong to the same cqSeed protein-015 and cqSeed oil-016 QTLs, as previously reported by <xref ref-type="bibr" rid="B61">Pathan et&#xa0;al. (2013)</xref>. The <italic>qSOC8.1</italic> fell within the genomic region (7525742- 9439751) of previously reported QTL viz., Seed oil 11-g2 (<xref ref-type="bibr" rid="B87">Yao et&#xa0;al., 2020</xref>). Similarly, <italic>qSOC8.2</italic> fell within the genomic regions (7966391- 11892640) of earlier reported QTL viz., Seed oil 1-1 (<xref ref-type="bibr" rid="B48">Mansur et&#xa0;al., 1993</xref>). The physical interval of <italic>qSOC8.3</italic> was located within the genomic region of earlier reported QTL viz., Seed oil 43-1 (<xref ref-type="bibr" rid="B49">Mao et&#xa0;al., 2013</xref>). The <italic>qSOC_SPC8</italic> present on the Chr.08 fell within the physical intervals of earlier reported QTLs viz., Seed oil 8-g13 (<xref ref-type="bibr" rid="B95">Zhang et&#xa0;al., 2018b</xref>) and Seed protein 34-5 (<xref ref-type="bibr" rid="B46">Lu et&#xa0;al., 2013</xref>) QTLs, hence <italic>qSOC_SPC8</italic> might be the same QTLs as that of Seed oil 8-g13 and Seed protein 34-5. The <italic>qSOC10</italic> present on the Chr.10 was located within the physical interval (44580197- 44718071) of earlier reported QTL viz., Seed oil 39-16, hence representing the same QTL (<xref ref-type="bibr" rid="B78">Wang et&#xa0;al., 2014</xref>). Moreover, the <italic>qSPC12</italic> fell within the genomic region (4520131- 6391062) of previously reported QTL viz., Seed protein 28-3 (<xref ref-type="bibr" rid="B41">Liang et&#xa0;al., 2010</xref>). <italic>qSOC15</italic> located on the Chr.15 might be the same QTLs as previously reported mqSeed Oil-014 (<xref ref-type="bibr" rid="B64">Qi et&#xa0;al., 2011</xref>), as the <italic>qSOC15</italic> fell within the genomic interval (10392903-10393032) of mqSeed Oil-014. The <italic>qSPC18</italic> lied across the genomic region (1736692-56797602) of earlier documented QTL viz., Seed protein 36-25 (<xref ref-type="bibr" rid="B49">Mao et&#xa0;al., 2013</xref>). The <italic>qSPC20</italic> fell within the genomic interval (2615587&#x2013;41000124 bp) of previously reported QTL viz., Seed protein 36-26 (<xref ref-type="bibr" rid="B49">Mao et&#xa0;al., 2013</xref>). Zhao et&#xa0;al (<xref ref-type="bibr" rid="B98">2024</xref>) found that the SNP named rs20739 present on Chr.18 was associated with SOC, which fell within the genomic interval of <italic>qSOC18</italic> (57712803-57856803). However, no QTL was identified to date that lies across the genomic interval of <italic>qSOC1</italic>, <italic>qSPC1</italic>, <italic>qSOC9</italic>, <italic>qSOC_SPC15.1</italic> and <italic>qSOC_SPC15.2</italic> (<xref ref-type="supplementary-material" rid="SF2"><bold>Supplementary Figure&#xa0;2</bold></xref>). Therefore, these five QTLs were newly reported/novel QTLs for SOC or/and SPC identified in the current study. Here, we report that GWAS analysis substantially diminished the genomic interval of the earlier detected QTLs, thus providing the proof for the higher resolution of GWAS analysis in QTL identification. The classical mapping method possesses reduced resolution because it utilizes the biparental population in the genetic mapping, that in turn results in a larger confidence interval of earlier documented QTLs (<xref ref-type="bibr" rid="B88">Yu et&#xa0;al., 2024</xref>). Hence, high-resolution stable QTLs identified by the GWAS in the current study will be potentially harnessed in the molecular breeding programs for the improvement of SOC and SPC in soybean.</p>
</sec>
<sec id="s4_5">
<label>4.5</label>
<title>Identifying potential candidate genes regulating SOC and SPC in soybean</title>
<p>The central objective of the researcher is to find-out true candidate genes governing the trait of interest that are underlying the major QTLs. Successful validation of function for the candidate genes underlying the QTLs will dictate their potential use in breeding programs. The true genes regulating the SOC and SPC traits have remained largely unexplored, and only a few genes regulating these traits in soybean have been characterized (as reviewed by <xref ref-type="bibr" rid="B54">Mo et&#xa0;al. (2024)</xref>). Based on the <italic>in-silico</italic>, sequence variation, variant annotation and haplotype analysis, we prioritized 80 genes as the candidates regulating the SOC and SPC in Northeast China soybeans. Among them, 12 genes undergo divergent selection between low-latitudes and high-latitudes; hence, these 12 genes will be considered as the potential candidates regulating SOC and SPC traits in soybean, as well as regulating the difference in the quality traits among the soybeans adapted to different environments. For example, the ortholog of <italic>Glyma.01G175500</italic> in <italic>Arabidopsis thaliana</italic> is <italic>CYP90B1</italic> (<xref ref-type="bibr" rid="B93">Zhang et&#xa0;al., 2024a</xref>). The <italic>CYP90B1</italic> encodes the steroid C-22 hydroxylase that plays an important role in the sterol biosynthesis (<xref ref-type="bibr" rid="B93">Zhang et&#xa0;al., 2024a</xref>). The ortholog of <italic>Glyma.01G176000</italic> is <italic>EMB2754</italic>, and the <italic>EMB2754</italic> encodes the Vacuolar sorting protein 39, and has been reported to transport the proteins into vacuoles during seed development (<xref ref-type="bibr" rid="B75">Tsao et&#xa0;al., 2022</xref>), and lipid transfer in Arabidopsis (<xref ref-type="bibr" rid="B52">Michaud et&#xa0;al., 2017</xref>). The <italic>Glyma.08G101100</italic> ortholog in Arabidopsis is <italic>AT1G67680</italic> that encodes SRP72; the SRP protein mediates the transport of secretory proteins to the endoplasmic reticulum (ER) in plants, and it has been documented that storage proteins reach the protein storage vacuoles (PSV) through a vesicle-mediated biosynthetic trafficking pathway that includes the ER, the Golgi apparatus, the tubulovesicular network (TGN) and the endosomes/prevacuoles (<xref ref-type="bibr" rid="B91">Zeng et&#xa0;al., 2023</xref>). <italic>Glyma.08G101900</italic> is an ortholog of <italic>AT5G40780</italic> which encodes lysine histidine transporter 1 (LHT1) in Arabidopsis (<xref ref-type="bibr" rid="B7">Chen and Bush, 1997</xref>). The LHT1 is a high-affinity transporter for cellular amino acids in both roots and shoots, hence is important in the biosynthesis of proteins (<xref ref-type="bibr" rid="B66">Rabby et&#xa0;al., 2022</xref>). In soybean the <italic>Glyma.08G103100</italic> is an ortholog of <italic>AT1G24330</italic> which encodes the ARM repeat superfamily protein; and this protein belongs to E3 ubiquitin ligase. In Brassica species the ARM repeat protein viz., ARC1 acts downstream of the S receptor kinase to promote ubiquitination and protein degradation (<xref ref-type="bibr" rid="B73">Stone et&#xa0;al., 2003</xref>). The <italic>Glyma.08G111700</italic> and <italic>Glyma.08G111800</italic> are the ortholog of <italic>AT5G55160/SUMO2/ATSUMO2</italic> which encodes for small ubiquitin-like modifier 2 in Arabidopsis (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>). The ubiquitin-like modifier stabilizes the proteins to which it is conjugated; and removal of the ubiquitin-like modifier results in degradation of the proteins (<xref ref-type="bibr" rid="B53">Miura et&#xa0;al., 2009</xref>). Gene viz., <italic>Glyma.08G117000</italic> is an ortholog of <italic>AT5G45800</italic>/<italic>MEE62</italic> that encodes for leucine-rich repeat protein kinase family protein, and these proteins have been documented to play important roles in plant growth, development and stress responses (<xref ref-type="bibr" rid="B71">Song et&#xa0;al., 2022</xref>). The <italic>Glyma.15G232200</italic> is an ortholog of <italic>AT3G56710/SIB1</italic> gene that encodes for sigma factor binding protein 1; and this gene has been documented to play an important role under nitrogen starvation, and nitrogen is the primary component in the protein synthesis (<xref ref-type="bibr" rid="B67">Ramel et&#xa0;al., 2007</xref>). The <italic>Glyma.18G258000</italic> and <italic>Glyma.18G258100</italic> are the orthologs of <italic>AT3G29590/AT5MAT</italic> and <italic>AT3G49190</italic>, respectively that encode for acyl-transferase family proteins, and these proteins are important in the <italic>de-novo</italic> fatty-acid biosynthesis (<xref ref-type="bibr" rid="B85">Yang et&#xa0;al., 2021</xref>). Moreover, the ortholog of <italic>Glyma.18G259100</italic> in <italic>Arabidopsis thaliana</italic> is <italic>AT3G28910/MYB30</italic> (<xref ref-type="bibr" rid="B44">Liu et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B84">Yan et&#xa0;al., 2020</xref>). The MYB30 belongs to subgroup I, that governs the biosynthesis of very-long-chain fatty acids (VLCFAs) by regulating genes encoding the four enzymes of the acyl-CoA elongase complex (<xref ref-type="bibr" rid="B101">Zhukov and Popov, 2022</xref>). Hence, the divergent selection of these 12 genes across the soybean populations adapted to different regions might be the reason of the unique characteristics of the SOC and SPC in Northeast China.</p>
<p>In conclusion, we identified the haplotype alleles within the 15 haplotype blocks as well as within the 80 candidate genes across the soybean germplasm of 340 accessions that regulate the SOC or SPC or both traits from the minimum to maximum levels through different intermediate phenotypes. Hence, these haplotypes can be used to produce cultivars of soybean with desired SOC and SPC.</p>
<p>Besides, we identified key genes that were divergently selected between the soybeans adapted to different regions of China, and they might be the important genes regulating the difference in the SOC and SPC across the various latitude regions.</p>
</sec>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>Here, we utilized a comprehensive approach to find-out the genetic structure of SOC and SPC traits in high-latitude adapted soybeans. The present study identified 105 and 59 significant SNPs associated with the SOC and SPC traits, respectively across the germplasm; and among them only three significant SNPs were associated with both SOC and SPC. Besides, we identified a total of 15 haplotype blocks distributed on nine chromosomes. Among them 14 and 11 haplotype blocks were linked with SOC and SPC, respectively. Furthermore, the present study identified 17 QTLs associated with either SOC or SPC or both traits; five of them were novel identified for the first time. <italic>In-silico</italic> analyses allowed us to prioritize 121 putative candidate genes present across the genomic regions of the 17 identified QTLs. Furthermore, based on the sequence variation, variant annotation, and haplotype analysis, 80 of the 121 genes were screened out as potential candidates regulating the SOC and/or SPC traits. In these 80 genes, the haplotype allele number varied from 2&#x2013;8 across soybean germplasm of 340 accessions. Overall, the haplotype alleles identified in the 15 haplotype blocks and 80 candidate genes across the 340 accessions regulate the SOC or/and SPC from the minimum to maximum levels through intermediate phenotypes. Furthermore, our results revealed that 12 of these 80 genes were divergently selected below low- and high-latitudes; hence they might be the major genes regulating the difference in the SOC and SPC traits in the low-latitudes and high-latitudes. We identified many independent SNPs, haplotypes and QTLs associated with either SOC or SPC that can provide the opportunity to improve these two highly negatively-correlated traits simultaneously in the same soybean cultivar. Overall, the insights generated from this study provide valuable genomic resources for the optimization of the SOC and SPC in the soybean cultivars. In conclusion, the novel findings reported in this study hold significant potential for developing Northeast-China adapted soybean cultivars with enhanced quality and yield.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <uri xlink:href="https://ngdc.cncb.ac.cn/gvm/">https://ngdc.cncb.ac.cn/gvm/</uri>, GVM000764.</p></sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>MB: Data curation, Formal analysis, Investigation, Methodology, Validation, Visualization, Writing &#x2013; original draft. YZ: Data curation, Formal analysis, Writing &#x2013; review &amp; editing. WX: Data curation, Formal analysis, Writing &#x2013; review &amp; editing. YL: Data curation, Formal analysis, Writing &#x2013; review &amp; editing. HY: Writing &#x2013; review &amp; editing, Data curation, Formal analysis. YHZ: Data curation, Formal analysis, Writing &#x2013; review &amp; editing. SY: Funding acquisition, Project administration, Resources, Supervision, Writing &#x2013; review &amp; editing. JB: Data curation, Formal analysis, Methodology, Writing &#x2013; original draft. XF: Conceptualization, Funding acquisition, Methodology, Project administration, Resources, Supervision, Writing &#x2013; review &amp; editing.</p></sec>
<ack>
<title>Acknowledgments</title>
<p>We want to thank &#x201c;Changchun Computing Center&#x201d; and &#x201c;Eco-Innovation Center&#x201d; for providing inclusive computing power and technical support during the completion of this paper.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2026.1767299/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2026.1767299/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="DataSheet1.docx" id="SF1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Figure&#xa0;1</label>
<caption>
<p>Frequency distribution of the SOC <bold>(A)</bold> and SPC <bold>(B)</bold> in the GWAS panel of 340 soybean accessions across the four different environments viz., CC22, CC23, CC24 &amp; JT24.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Figure&#xa0;2</label>
<caption>
<p>Map showing the comparison of the QTLs identified in the present study with the previously reported QTLs.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF3" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Figure&#xa0;3</label>
<caption>
<p>Diagram showing the <italic>F<sub>ST</sub></italic>, <italic>&#x3c0;</italic> and Tajima&#x2019;s <italic>D</italic> analysis of population differentiation as well as distribution of the different haplotypes of <italic>Glyma.01G175500</italic> and <italic>Glyma.01G176000</italic> genes across the soybeans adapted to different latitudes (China-I to China-VI).</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF4" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Figure&#xa0;4</label>
<caption>
<p>Diagram showing the <italic>F<sub>ST</sub></italic>, <italic>&#x3c0;</italic> and Tajima&#x2019;s <italic>D</italic> analysis of population differentiation as well as distribution of the different haplotypes of <italic>Glyma.08G101100</italic>, <italic>Glyma.08G101900</italic> and <italic>Glyma.06G103100</italic> genes across the soybeans adapted to different latitudes (China-I to China-VI).</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF5" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Figure&#xa0;5</label>
<caption>
<p>Diagram showing the <italic>F<sub>ST</sub></italic>, <italic>&#x3c0;</italic> and Tajima&#x2019;s <italic>D</italic> analysis of population differentiation as well as distribution of the different haplotypes of <italic>Glyma.08G111700</italic>, and <italic>Glyma.06G111800</italic> genes across the soybeans adapted to different latitudes (China-I to China-VI).</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF6" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Figure&#xa0;6</label>
<caption>
<p>Diagram showing the <italic>F<sub>ST</sub></italic>, <italic>&#x3c0;</italic> and Tajima&#x2019;s <italic>D</italic> analysis of population differentiation as well as distribution of the different haplotypes of <italic>Glyma.08G117000</italic>, across the soybeans adapted to different latitudes (China-I to China-VI).</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF7" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Figure&#xa0;7</label>
<caption>
<p>Diagram showing the <italic>F<sub>ST</sub></italic>, <italic>&#x3c0;</italic> and Tajima&#x2019;s <italic>D</italic> analysis of population differentiation as well as distribution of the different haplotypes of <italic>Glyma.15G232200</italic> across the soybeans adapted to different latitudes (China-I to China-VI).</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF8" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Figure&#xa0;8</label>
<caption>
<p>Diagram showing the <italic>F<sub>ST</sub></italic>, <italic>&#x3c0;</italic> and Tajima&#x2019;s <italic>D</italic> analysis of population differentiation as well as distribution of the different haplotypes of <italic>Glyma.18G258000</italic>, <italic>Glyma.18G258100</italic> and <italic>Glyma.18G259100</italic> genes across the soybeans adapted to different latitudes (China-I to China-VI).</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF9" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Table&#xa0;1</label>
<caption>
<p>List of 340 soybean accessions along with their geographic origin used in the GWAS analysis.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF10" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Table&#xa0;2</label>
<caption>
<p>Phenotypic analysis of seed oil content (SOC) and seed protein content (SPC) of 340 soybean accessions evaluated in different individual environments plus combined environment (CE).</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF11" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Table&#xa0;3</label>
<caption>
<p>Distribution of the SNPs used for GWAS across soybean chromosomes.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF12" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Table&#xa0;4</label>
<caption>
<p>SNP markers and stable QTLs significantly associated with seed oil content (SOC) and seed protein content (SPC) across different environments and models.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF13" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Table&#xa0;5</label>
<caption>
<p>Haplotype analysis of 15 haplotype blocks identified in the present study across the panel of 340 soybean accessions.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF14" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Table&#xa0;6</label>
<caption>
<p>Phenotypic variance explained (PVE) by the identified 17 stable QTLs in the combined environment.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF15" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Table&#xa0;7</label>
<caption>
<p>Putative candidate genes selected based on the <italic>in-silico</italic> analysis and gene function annotation across the 17 QTLs.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF16" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Table&#xa0;8</label>
<caption>
<p>Variant annotation of selected putative candidate genes (only 104 among the total 121 genes selected based on the <italic>in-silico</italic> analysis and gene function annotation showed variant annotation).</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.docx" id="SF17" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"><label>Supplementary Table&#xa0;9</label>
<caption>
<p>The haplotype analysis results of the candidate genes.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table1.xlsx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Abbai</surname> <given-names>R.</given-names></name>
<name><surname>Singh</surname> <given-names>V. K.</given-names></name>
<name><surname>Nachimuthu</surname> <given-names>V. V.</given-names></name>
<name><surname>Sinha</surname> <given-names>P.</given-names></name>
<name><surname>Selvaraj</surname> <given-names>R.</given-names></name>
<name><surname>Vipparla</surname> <given-names>A. K.</given-names></name>
<etal/>
</person-group>. (<year>2019</year>). 
<article-title>Haplotype analysis of key genes governing grain yield and quality traits across 3K RG panel reveals scope for the development of tailor-made rice with enhanced genetic gains</article-title>. <source>Plant Biotechnol. J.</source> <volume>17</volume>, <fpage>1612</fpage>&#x2013;<lpage>1622</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pbi.13087</pub-id>, PMID: <pub-id pub-id-type="pmid">30701663</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Alqudah</surname> <given-names>A. M.</given-names></name>
<name><surname>Sallam</surname> <given-names>A.</given-names></name>
<name><surname>Stephen Baenziger</surname> <given-names>P.</given-names></name>
<name><surname>B&#xf6;rner</surname> <given-names>A.</given-names></name>
</person-group> (<year>2020</year>). 
<article-title>GWAS: Fast-forwarding gene identification and characterization in temperate Cereals: lessons from Barley &#x2013; A review</article-title>. <source>J. Advanced Res.</source> <volume>22</volume>, <fpage>119</fpage>&#x2013;<lpage>135</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jare.2019.10.013</pub-id>, PMID: <pub-id pub-id-type="pmid">31956447</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Barrett</surname> <given-names>J. C.</given-names></name>
<name><surname>Fry</surname> <given-names>B.</given-names></name>
<name><surname>Maller</surname> <given-names>J.</given-names></name>
<name><surname>Daly</surname> <given-names>M. J.</given-names></name>
</person-group> (<year>2004</year>). 
<article-title>Haploview: analysis and visualization of LD and haplotype maps</article-title>. <source>Bioinformatics</source> <volume>21</volume>, <fpage>263</fpage>&#x2013;<lpage>265</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bth457</pub-id>, PMID: <pub-id pub-id-type="pmid">15297300</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bates</surname> <given-names>D.</given-names></name>
<name><surname>M&#xe4;chler</surname> <given-names>M.</given-names></name>
<name><surname>Bolker</surname> <given-names>B.</given-names></name>
<name><surname>Walker</surname> <given-names>S.</given-names></name>
</person-group> (<year>2015</year>). 
<article-title>Fitting linear mixed-effects models using lme4</article-title>. <source>J. Stat. Software</source> <volume>67</volume>, <fpage>1</fpage>&#x2013;<lpage>48</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.18637/jss.v067.i01</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bhat</surname> <given-names>J. A.</given-names></name>
<name><surname>Yu</surname> <given-names>D.</given-names></name>
<name><surname>Bohra</surname> <given-names>A.</given-names></name>
<name><surname>Ganie</surname> <given-names>S. A.</given-names></name>
<name><surname>Varshney</surname> <given-names>R. K.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Features and applications of haplotypes in crop breeding</article-title>. <source>Commun. Biol.</source> <volume>4</volume>, <fpage>1266</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s42003-021-02782-y</pub-id>, PMID: <pub-id pub-id-type="pmid">34737387</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Capilla-P&#xe9;rez</surname> <given-names>L.</given-names></name>
<name><surname>Solier</surname> <given-names>V.</given-names></name>
<name><surname>Gilbault</surname> <given-names>E.</given-names></name>
<name><surname>Lian</surname> <given-names>Q.</given-names></name>
<name><surname>Goel</surname> <given-names>M.</given-names></name>
<name><surname>Huettel</surname> <given-names>B.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Enhanced recombination empowers the detection and mapping of Quantitative Trait Loci</article-title>. <source>Commun. Biol.</source> <volume>7</volume>, <fpage>829</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s42003-024-06530-w</pub-id>, PMID: <pub-id pub-id-type="pmid">38977904</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chen</surname> <given-names>L.</given-names></name>
<name><surname>Bush</surname> <given-names>D. R.</given-names></name>
</person-group> (<year>1997</year>). 
<article-title>LHT1, a lysine- and histidine-specific amino acid transporter in Arabidopsis</article-title>. <source>Plant Physiol.</source> <volume>115</volume>, <fpage>1127</fpage>&#x2013;<lpage>1134</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1104/pp.115.3.1127</pub-id>, PMID: <pub-id pub-id-type="pmid">9390441</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chen</surname> <given-names>L.</given-names></name>
<name><surname>Taliercio</surname> <given-names>E.</given-names></name>
<name><surname>Li</surname> <given-names>Z.</given-names></name>
<name><surname>Mian</surname> <given-names>R.</given-names></name>
<name><surname>Carter</surname> <given-names>T. E.</given-names></name>
<name><surname>Wei</surname> <given-names>H.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Characterization of a <italic>G. max</italic>&#x2009;&#xd7;&#x2009;<italic>G. soja</italic> nested association mapping population and identification of loci controlling seed composition traits from wild soybean</article-title>. <source>Theor. Appl. Genet.</source> <volume>138</volume>, <fpage>65</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00122-025-04848-5</pub-id>, PMID: <pub-id pub-id-type="pmid">40053052</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chen</surname> <given-names>S.</given-names></name>
<name><surname>Zhou</surname> <given-names>Y.</given-names></name>
<name><surname>Chen</surname> <given-names>Y.</given-names></name>
<name><surname>Gu</surname> <given-names>J.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>fastp: an ultra-fast all-in-one FASTQ preprocessor</article-title>. <source>Bioinformatics</source> <volume>34</volume>, <fpage>i884</fpage>&#x2013;<lpage>i890</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bty560</pub-id>, PMID: <pub-id pub-id-type="pmid">30423086</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cingolani</surname> <given-names>P.</given-names></name>
<name><surname>Platts</surname> <given-names>A.</given-names></name>
<name><surname>Wang</surname> <given-names>L. L.</given-names></name>
<name><surname>Coon</surname> <given-names>M.</given-names></name>
<name><surname>Nguyen</surname> <given-names>T.</given-names></name>
<name><surname>Wang</surname> <given-names>L.</given-names></name>
<etal/>
</person-group>. (<year>2012</year>). 
<article-title>A program for annotating and predicting the effects of single nucleotide polymorphisms, SnpEff: SNPs in the genome of Drosophila melanogaster strain w<sup>1118</sup>; iso-2; iso-3</article-title>. <source>Fly</source> <volume>6</volume>, <fpage>80</fpage>&#x2013;<lpage>92</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4161/fly.19695</pub-id>, PMID: <pub-id pub-id-type="pmid">22728672</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Conway</surname> <given-names>J. R.</given-names></name>
<name><surname>Lex</surname> <given-names>A.</given-names></name>
<name><surname>Gehlenborg</surname> <given-names>N.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>UpSetR: an R package for the visualization of intersecting sets and their properties</article-title>. <source>Bioinformatics</source> <volume>33</volume>, <fpage>2938</fpage>&#x2013;<lpage>2940</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btx364</pub-id>, PMID: <pub-id pub-id-type="pmid">28645171</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cook</surname> <given-names>D. E.</given-names></name>
<name><surname>Andersen</surname> <given-names>E. C.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>VCF-kit: assorted utilities for the variant call format</article-title>. <source>Bioinformatics</source> <volume>33</volume>, <fpage>1581</fpage>&#x2013;<lpage>1582</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btx011</pub-id>, PMID: <pub-id pub-id-type="pmid">28093408</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Danecek</surname> <given-names>P.</given-names></name>
<name><surname>Auton</surname> <given-names>A.</given-names></name>
<name><surname>Abecasis</surname> <given-names>G.</given-names></name>
<name><surname>Albers</surname> <given-names>C. A.</given-names></name>
<name><surname>Banks</surname> <given-names>E.</given-names></name>
<name><surname>DePristo</surname> <given-names>M. A.</given-names></name>
<etal/>
</person-group>. (<year>2011</year>). 
<article-title>The variant call format and VCFtools</article-title>. <source>Bioinformatics</source> <volume>27</volume>, <fpage>2156</fpage>&#x2013;<lpage>2158</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btr330</pub-id>, PMID: <pub-id pub-id-type="pmid">21653522</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Diers</surname> <given-names>B. W.</given-names></name>
<name><surname>Specht</surname> <given-names>J. E.</given-names></name>
<name><surname>Graef</surname> <given-names>G. L.</given-names></name>
<name><surname>Song</surname> <given-names>Q.</given-names></name>
<name><surname>Rainey</surname> <given-names>K. M.</given-names></name>
<name><surname>Ramasubramanian</surname> <given-names>V.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Genetic architecture of protein and oil content in soybean seed and meal</article-title>. <source>Plant Genome</source> <volume>16</volume>, <fpage>e20308</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/tpg2.20308</pub-id>, PMID: <pub-id pub-id-type="pmid">36744727</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Doszhanova</surname> <given-names>B.</given-names></name>
<name><surname>Zatybekov</surname> <given-names>A.</given-names></name>
<name><surname>Didorenko</surname> <given-names>S.</given-names></name>
<name><surname>Fang</surname> <given-names>C.</given-names></name>
<name><surname>Abugalieva</surname> <given-names>S.</given-names></name>
<name><surname>Turuspekov</surname> <given-names>Y.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Genome-wide association study of seed quality and yield traits in a soybean collection from southeast Kazakhstan</article-title>. <source>Agronomy</source> <volume>14</volume>, <fpage>2746</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/agronomy14112746</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Duan</surname> <given-names>Z.</given-names></name>
<name><surname>Li</surname> <given-names>Q.</given-names></name>
<name><surname>Wang</surname> <given-names>H.</given-names></name>
<name><surname>He</surname> <given-names>X.</given-names></name>
<name><surname>Zhang</surname> <given-names>M.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Genetic regulatory networks of soybean seed size, oil and protein contents</article-title>. <source>Front. Plant Sci.</source> <volume>14</volume>, <elocation-id>1160418</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2023.1160418</pub-id>, PMID: <pub-id pub-id-type="pmid">36959925</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Duan</surname> <given-names>Z.</given-names></name>
<name><surname>Xu</surname> <given-names>L.</given-names></name>
<name><surname>Zhou</surname> <given-names>G.</given-names></name>
<name><surname>Zhu</surname> <given-names>Z.</given-names></name>
<name><surname>Wang</surname> <given-names>X.</given-names></name>
<name><surname>Shen</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Unlocking soybean potential: genetic resources and omics for breeding</article-title>. <source>J. Genet. Genomics</source> <volume>52</volume>(<issue>11</issue>), <page-range>1337&#x2013;1346</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jgg.2025.02.004</pub-id>, PMID: <pub-id pub-id-type="pmid">39984157</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Duggal</surname> <given-names>P.</given-names></name>
<name><surname>Gillanders</surname> <given-names>E. M.</given-names></name>
<name><surname>Holmes</surname> <given-names>T. N.</given-names></name>
<name><surname>Bailey-Wilson</surname> <given-names>J. E.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>Establishing an adjusted p-value threshold to control the family-wide type 1 error in genome wide association studies</article-title>. <source>BMC Genomics</source> <volume>9</volume>, <elocation-id>516</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2164-9-516</pub-id>, PMID: <pub-id pub-id-type="pmid">18976480</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gao</surname> <given-names>W.</given-names></name>
<name><surname>Ma</surname> <given-names>R.</given-names></name>
<name><surname>Li</surname> <given-names>X.</given-names></name>
<name><surname>Liu</surname> <given-names>J.</given-names></name>
<name><surname>Jiang</surname> <given-names>A.</given-names></name>
<name><surname>Tan</surname> <given-names>P.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Construction of genetic map and QTL mapping for seed size and quality traits in soybean (<italic>Glycine max</italic> L.)</article-title>. <source>Int. J. Mol. Sci.</source> <volume>25</volume>, <elocation-id>2857</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms25052857</pub-id>, PMID: <pub-id pub-id-type="pmid">38474104</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gu</surname> <given-names>Z.</given-names></name>
<name><surname>Eils</surname> <given-names>R.</given-names></name>
<name><surname>Schlesner</surname> <given-names>M.</given-names></name>
</person-group> (<year>2016</year>). 
<article-title>Complex heatmaps reveal patterns and correlations in multidimensional genomic data</article-title>. <source>Bioinformatics</source> <volume>32</volume>, <fpage>2847</fpage>&#x2013;<lpage>2849</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btw313</pub-id>, PMID: <pub-id pub-id-type="pmid">27207943</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Guo</surname> <given-names>B.</given-names></name>
<name><surname>Sun</surname> <given-names>L.</given-names></name>
<name><surname>Jiang</surname> <given-names>S.</given-names></name>
<name><surname>Ren</surname> <given-names>H.</given-names></name>
<name><surname>Sun</surname> <given-names>R.</given-names></name>
<name><surname>Wei</surname> <given-names>Z.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Soybean genetic resources contributing to sustainable protein production</article-title>. <source>Theor. Appl. Genet.</source> <volume>135</volume>, <fpage>4095</fpage>&#x2013;<lpage>4121</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00122-022-04222-9</pub-id>, PMID: <pub-id pub-id-type="pmid">36239765</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Guo</surname> <given-names>Y.</given-names></name>
<name><surname>Huang</surname> <given-names>Y.</given-names></name>
<name><surname>Hou</surname> <given-names>L.</given-names></name>
<name><surname>Ma</surname> <given-names>J.</given-names></name>
<name><surname>Chen</surname> <given-names>C.</given-names></name>
<name><surname>Ai</surname> <given-names>H.</given-names></name>
<etal/>
</person-group>. (<year>2017</year>). 
<article-title>Genome-wide detection of genetic markers associated with growth and fatness in four pig populations using four approaches</article-title>. <source>Genet. Selection Evol.</source> <volume>49</volume>, <fpage>21</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12711-017-0295-4</pub-id>, PMID: <pub-id pub-id-type="pmid">28196480</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>He</surname> <given-names>J.</given-names></name>
<name><surname>Gai</surname> <given-names>J.</given-names></name>
</person-group> (<year>2023</year>). &#x201c;
<article-title>Genome-Wide Association Studies (GWAS)</article-title>,&#x201d; in <source>Plant Genotyping: Methods and Protocols</source>. Ed. 
<person-group person-group-type="editor">
<name><surname>Shavrukov</surname> <given-names>Y.</given-names></name>
</person-group> (
<publisher-name>Springer US</publisher-name>, <publisher-loc>New York, NY</publisher-loc>), <fpage>123</fpage>&#x2013;<lpage>146</lpage>.
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>He</surname> <given-names>Q.</given-names></name>
<name><surname>Xiang</surname> <given-names>S.</given-names></name>
<name><surname>Yang</surname> <given-names>H.</given-names></name>
<name><surname>Wang</surname> <given-names>W.</given-names></name>
<name><surname>Shu</surname> <given-names>Y.</given-names></name>
<name><surname>Li</surname> <given-names>Z.</given-names></name>
<etal/>
</person-group>. (<year>2021</year>). 
<article-title>A genome-wide association study of seed size, protein content, and oil content using a natural population of Sichuan and Chongqing soybean</article-title>. <source>Euphytica</source> <volume>217</volume>, <fpage>198</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10681-021-02931-8</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hellsten</surname> <given-names>U.</given-names></name>
<name><surname>Wright</surname> <given-names>K. M.</given-names></name>
<name><surname>Jenkins</surname> <given-names>J.</given-names></name>
<name><surname>Shu</surname> <given-names>S.</given-names></name>
<name><surname>Yuan</surname> <given-names>Y.</given-names></name>
<name><surname>Wessler</surname> <given-names>S. R.</given-names></name>
<etal/>
</person-group>. (<year>2013</year>). 
<article-title>Fine-scale variation in meiotic recombination in Mimulus inferred from population shotgun sequencing</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>110</volume>, <fpage>19478</fpage>&#x2013;<lpage>19482</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1319032110</pub-id>, PMID: <pub-id pub-id-type="pmid">24225854</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Jin</surname> <given-names>H.</given-names></name>
<name><surname>Yang</surname> <given-names>X.</given-names></name>
<name><surname>Zhao</surname> <given-names>H.</given-names></name>
<name><surname>Song</surname> <given-names>X.</given-names></name>
<name><surname>Tsvetkov</surname> <given-names>Y. D.</given-names></name>
<name><surname>Wu</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Genetic analysis of protein content and oil content in soybean by genome-wide association study</article-title>. <source>Front. Plant Sci.</source> <volume>14</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2023.1182771</pub-id>, PMID: <pub-id pub-id-type="pmid">37346139</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kalantar Ahmadi</surname> <given-names>S. A.</given-names></name>
<name><surname>Sarhangi</surname> <given-names>M.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>Optimizing sowing date for enhanced heat stress tolerance in canola (<italic>Brassica napus</italic> L.): Investigating impacts on seed yield, oil content, and fatty acids composition</article-title>. <source>Heliyon</source> <volume>11</volume>, <elocation-id>e42138</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.heliyon.2025.e42138</pub-id>, PMID: <pub-id pub-id-type="pmid">39925356</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kaler</surname> <given-names>A. S.</given-names></name>
<name><surname>Gillman</surname> <given-names>J. D.</given-names></name>
<name><surname>Beissinger</surname> <given-names>T.</given-names></name>
<name><surname>Purcell</surname> <given-names>L. C.</given-names></name>
</person-group> (<year>2020</year>). 
<article-title>Comparing different statistical models and multiple testing corrections for association mapping in soybean and maize</article-title>. <source>Front. Plant Sci.</source> <volume>10</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2019.01794</pub-id>, PMID: <pub-id pub-id-type="pmid">32158452</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Karges</surname> <given-names>K.</given-names></name>
<name><surname>Bellingrath-Kimura</surname> <given-names>S. D.</given-names></name>
<name><surname>Watson</surname> <given-names>C. A.</given-names></name>
<name><surname>Stoddard</surname> <given-names>F. L.</given-names></name>
<name><surname>Halwani</surname> <given-names>M.</given-names></name>
<name><surname>Reckling</surname> <given-names>M.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Agro-economic prospects for expanding soybean production beyond its current northerly limit in Europe</article-title>. <source>Eur. J. Agron.</source> <volume>133</volume>, <elocation-id>126415</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eja.2021.126415</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Karikari</surname> <given-names>B.</given-names></name>
<name><surname>Li</surname> <given-names>S.</given-names></name>
<name><surname>Bhat</surname> <given-names>J. A.</given-names></name>
<name><surname>Cao</surname> <given-names>Y.</given-names></name>
<name><surname>Kong</surname> <given-names>J.</given-names></name>
<name><surname>Yang</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2019</year>). 
<article-title>Genome-wide detection of major and epistatic effect QTLs for seed protein and oil content in soybean under multiple environments using high-density bin map</article-title>. <source>Int. J. Mol. Sci.</source> <volume>20</volume>, <fpage>979</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms20040979</pub-id>, PMID: <pub-id pub-id-type="pmid">30813455</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kim</surname> <given-names>W. J.</given-names></name>
<name><surname>Kang</surname> <given-names>B. H.</given-names></name>
<name><surname>Kang</surname> <given-names>S.</given-names></name>
<name><surname>Shin</surname> <given-names>S.</given-names></name>
<name><surname>Chowdhury</surname> <given-names>S.</given-names></name>
<name><surname>Jeong</surname> <given-names>S. C.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>A genome-wide association study of protein, oil, and amino acid content in wild soybean (<italic>Glycine soja</italic>)</article-title>. <source>Plants</source> <volume>12</volume>, <fpage>1665</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/plants12081665</pub-id>, PMID: <pub-id pub-id-type="pmid">37111888</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kuroha</surname> <given-names>T.</given-names></name>
<name><surname>Nagai</surname> <given-names>K.</given-names></name>
<name><surname>Gamuyao</surname> <given-names>R.</given-names></name>
<name><surname>Wang</surname> <given-names>D. R.</given-names></name>
<name><surname>Furuta</surname> <given-names>T.</given-names></name>
<name><surname>Nakamori</surname> <given-names>M.</given-names></name>
<etal/>
</person-group>. (<year>2018</year>). 
<article-title>Ethylene-gibberellin signaling underlies adaptation of rice to periodic flooding</article-title>. <source>Science</source> <volume>361</volume>, <fpage>181</fpage>&#x2013;<lpage>186</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.aat1577</pub-id>, PMID: <pub-id pub-id-type="pmid">30002253</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lander</surname> <given-names>E.</given-names></name>
<name><surname>Kruglyak</surname> <given-names>L.</given-names></name>
</person-group> (<year>1995</year>). 
<article-title>Genetic dissection of complex traits: guidelines for interpreting and reporting linkage results</article-title>. <source>Nat. Genet.</source> <volume>11</volume>, <fpage>241</fpage>&#x2013;<lpage>247</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ng1195-241</pub-id>, PMID: <pub-id pub-id-type="pmid">7581446</pub-id>
</mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lee</surname> <given-names>S.</given-names></name>
<name><surname>Van</surname> <given-names>K.</given-names></name>
<name><surname>Sung</surname> <given-names>M.</given-names></name>
<name><surname>Nelson</surname> <given-names>R.</given-names></name>
<name><surname>LaMantia</surname> <given-names>J.</given-names></name>
<name><surname>McHale</surname> <given-names>L. K.</given-names></name>
<etal/>
</person-group>. (<year>2019</year>). 
<article-title>Genome-wide association study of seed protein, oil and amino acid contents in soybean from maturity groups I to IV</article-title>. <source>Theor. Appl. Genet.</source> <volume>132</volume>, <fpage>1639</fpage>&#x2013;<lpage>1659</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00122-019-03304-5</pub-id>, PMID: <pub-id pub-id-type="pmid">30806741</pub-id>
</mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Leventhal</surname> <given-names>L.</given-names></name>
<name><surname>Ruffley</surname> <given-names>M.</given-names></name>
<name><surname>Exposito-Alonso</surname> <given-names>M.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>). Planting genomes in the wild: Arabidopsis from genetics history to the ecology and evolutionary genomics era</article-title>. <source>Annu. Rev. Plant Biol.</source> <volume>76</volume>, <fpage>605</fpage>&#x2013;<lpage>635</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev-arplant-071123-095146</pub-id>, PMID: <pub-id pub-id-type="pmid">39971350</pub-id>
</mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>H.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM</article-title>. <source>arXiv preprint arXiv:1303.3997</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arXiv.1303.3997</pub-id>
</mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>H.</given-names></name>
<name><surname>Peng</surname> <given-names>Z.</given-names></name>
<name><surname>Yang</surname> <given-names>X.</given-names></name>
<name><surname>Wang</surname> <given-names>W.</given-names></name>
<name><surname>Fu</surname> <given-names>J.</given-names></name>
<name><surname>Wang</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2013</year>). 
<article-title>Genome-wide association study dissects the genetic architecture of oil biosynthesis in maize kernels</article-title>. <source>Nat. Genet.</source> <volume>45</volume>(<issue>1</issue>), <fpage>43</fpage>&#x2013;<lpage>50</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ng.2484</pub-id>, PMID: <pub-id pub-id-type="pmid">23242369</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>J.</given-names></name>
<name><surname>Zhang</surname> <given-names>Y.</given-names></name>
<name><surname>Ma</surname> <given-names>R.</given-names></name>
<name><surname>Huang</surname> <given-names>W.</given-names></name>
<name><surname>Hou</surname> <given-names>J.</given-names></name>
<name><surname>Fang</surname> <given-names>C.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Identification of <italic>ST1</italic> reveals a selection involving hitchhiking of seed morphology and oil content during soybean domestication</article-title>. <source>Plant Biotechnol. J.</source> <volume>20</volume>, <fpage>1110</fpage>&#x2013;<lpage>1121</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pbi.13791</pub-id>, PMID: <pub-id pub-id-type="pmid">35178867</pub-id>
</mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>D.</given-names></name>
<name><surname>Zhao</surname> <given-names>X.</given-names></name>
<name><surname>Han</surname> <given-names>Y.</given-names></name>
<name><surname>Li</surname> <given-names>W.</given-names></name>
<name><surname>Xie</surname> <given-names>F.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Genome-wide association mapping for seed protein and oil contents using a large panel of soybean accessions</article-title>. <source>Genomics</source> <volume>111</volume>, <fpage>90</fpage>&#x2013;<lpage>95</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ygeno.2018.01.004</pub-id>, PMID: <pub-id pub-id-type="pmid">29325965</pub-id>
</mixed-citation>
</ref>
<ref id="B40">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liang</surname> <given-names>Q.</given-names></name>
<name><surname>Chen</surname> <given-names>L.</given-names></name>
<name><surname>Yang</surname> <given-names>X.</given-names></name>
<name><surname>Yang</surname> <given-names>H.</given-names></name>
<name><surname>Liu</surname> <given-names>S.</given-names></name>
<name><surname>Kou</surname> <given-names>K.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Natural variation of <italic>Dt2</italic> determines branching in soybean</article-title>. <source>Nat. Commun.</source> <volume>13</volume>, <fpage>6429</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-022-34153-4</pub-id>, PMID: <pub-id pub-id-type="pmid">36307423</pub-id>
</mixed-citation>
</ref>
<ref id="B41">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liang</surname> <given-names>H.</given-names></name>
<name><surname>Yu</surname> <given-names>Y.</given-names></name>
<name><surname>Wang</surname> <given-names>S.</given-names></name>
<name><surname>Lian</surname> <given-names>Y.</given-names></name>
<name><surname>Wang</surname> <given-names>T.</given-names></name>
<name><surname>Wei</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2010</year>). 
<article-title>QTL mapping of isoflavone, oil and protein contents in soybean (<italic>Glycine max</italic> L. Merr.)</article-title>. <source>Agric. Sci. China</source> <volume>9</volume>, <fpage>1108</fpage>&#x2013;<lpage>1116</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/s1671-2927(09)60197-8</pub-id>
</mixed-citation>
</ref>
<ref id="B42">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lipka</surname> <given-names>A. E.</given-names></name>
<name><surname>Tian</surname> <given-names>F.</given-names></name>
<name><surname>Wang</surname> <given-names>Q.</given-names></name>
<name><surname>Peiffer</surname> <given-names>J.</given-names></name>
<name><surname>Li</surname> <given-names>M.</given-names></name>
<name><surname>Bradbury</surname> <given-names>P. J.</given-names></name>
<etal/>
</person-group>. (<year>2012</year>). 
<article-title>GAPIT: genome association and prediction integrated tool</article-title>. <source>Bioinformatics</source> <volume>28</volume>(<issue>18</issue>), <fpage>2397</fpage>&#x2013;<lpage>2399</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bts444</pub-id>, PMID: <pub-id pub-id-type="pmid">22796960</pub-id>
</mixed-citation>
</ref>
<ref id="B43">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>Z.</given-names></name>
<name><surname>Shi</surname> <given-names>X.</given-names></name>
<name><surname>Yang</surname> <given-names>Q.</given-names></name>
<name><surname>Li</surname> <given-names>Y.</given-names></name>
<name><surname>Yang</surname> <given-names>C.</given-names></name>
<name><surname>Zhang</surname> <given-names>M.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Landscape of rare-allele variants in cultivated and wild soybean genomes</article-title>. <source>Plant Genome</source> <volume>18</volume>, <fpage>e70020</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/tpg2.70020</pub-id>, PMID: <pub-id pub-id-type="pmid">40148071</pub-id>
</mixed-citation>
</ref>
<ref id="B44">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>L.</given-names></name>
<name><surname>Zhang</surname> <given-names>J.</given-names></name>
<name><surname>Adrian</surname> <given-names>J.</given-names></name>
<name><surname>Gissot</surname> <given-names>L.</given-names></name>
<name><surname>Coupland</surname> <given-names>G.</given-names></name>
<name><surname>Yu</surname> <given-names>D.</given-names></name>
<etal/>
</person-group>. (<year>2014</year>). 
<article-title>Elevated levels of <italic>MYB30</italic> in the phloem accelerate flowering in Arabidopsis through the regulation of FLOWERING LOCUS T</article-title>. <source>PloS One</source> <volume>9</volume>, <fpage>e89799</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0089799</pub-id>, PMID: <pub-id pub-id-type="pmid">24587042</pub-id>
</mixed-citation>
</ref>
<ref id="B45">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>Y.</given-names></name>
<name><surname>Zhang</surname> <given-names>Y.</given-names></name>
<name><surname>Liu</surname> <given-names>X.</given-names></name>
<name><surname>Shen</surname> <given-names>Y.</given-names></name>
<name><surname>Tian</surname> <given-names>D.</given-names></name>
<name><surname>Yang</surname> <given-names>X.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>SoyOmics: A deeply integrated database on soybean multi-omics</article-title>. <source>Mol. Plant</source> <volume>16</volume>, <fpage>794</fpage>&#x2013;<lpage>797</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.molp.2023.03.011</pub-id>, PMID: <pub-id pub-id-type="pmid">36950735</pub-id>
</mixed-citation>
</ref>
<ref id="B46">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lu</surname> <given-names>W.</given-names></name>
<name><surname>Wen</surname> <given-names>Z.</given-names></name>
<name><surname>Li</surname> <given-names>H.</given-names></name>
<name><surname>Yuan</surname> <given-names>D.</given-names></name>
<name><surname>Li</surname> <given-names>J.</given-names></name>
<name><surname>Zhang</surname> <given-names>H.</given-names></name>
<etal/>
</person-group>. (<year>2013</year>). 
<article-title>Identification of the quantitative trait loci (QTL) underlying water soluble protein content in soybean</article-title>. <source>Theor. Appl. Genet.</source> <volume>126</volume>, <fpage>425</fpage>&#x2013;<lpage>433</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00122-012-1990-8</pub-id>, PMID: <pub-id pub-id-type="pmid">23052024</pub-id>
</mixed-citation>
</ref>
<ref id="B47">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Majidian</surname> <given-names>P.</given-names></name>
<name><surname>Ghorbani</surname> <given-names>H. R.</given-names></name>
<name><surname>Farajpour</surname> <given-names>M.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Achieving agricultural sustainability through soybean production in Iran: Potential and challenges</article-title>. <source>Heliyon</source> <volume>10</volume>(<issue>4</issue>), <elocation-id>e26389</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.heliyon.2024.e26389</pub-id>, PMID: <pub-id pub-id-type="pmid">38404839</pub-id>
</mixed-citation>
</ref>
<ref id="B48">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mansur</surname> <given-names>L. M.</given-names></name>
<name><surname>Lark</surname> <given-names>K. G.</given-names></name>
<name><surname>Kross</surname> <given-names>H.</given-names></name>
<name><surname>Oliveira</surname> <given-names>A.</given-names></name>
</person-group> (<year>1993</year>). 
<article-title>Interval mapping of quantitative trait loci for reproductive, morphological, and seed traits of soybean (<italic>Glycine max</italic> L.)</article-title>. <source>Theor. Appl. Genet.</source> <volume>86</volume>, <fpage>907</fpage>&#x2013;<lpage>913</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF00211040</pub-id>, PMID: <pub-id pub-id-type="pmid">24193996</pub-id>
</mixed-citation>
</ref>
<ref id="B49">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mao</surname> <given-names>T.</given-names></name>
<name><surname>Jiang</surname> <given-names>Z.</given-names></name>
<name><surname>Han</surname> <given-names>Y.</given-names></name>
<name><surname>Teng</surname> <given-names>W.</given-names></name>
<name><surname>Zhao</surname> <given-names>X.</given-names></name>
<name><surname>Li</surname> <given-names>W.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Identification of quantitative trait loci underlying seed protein and oil contents of soybean across multi-genetic backgrounds and environments</article-title>. <source>Plant Breed.</source> <volume>132</volume>, <fpage>630</fpage>&#x2013;<lpage>641</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pbr.12091</pub-id>
</mixed-citation>
</ref>
<ref id="B50">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>McKenna</surname> <given-names>A.</given-names></name>
<name><surname>Hanna</surname> <given-names>M.</given-names></name>
<name><surname>Banks</surname> <given-names>E.</given-names></name>
<name><surname>Sivachenko</surname> <given-names>A.</given-names></name>
<name><surname>Cibulskis</surname> <given-names>K.</given-names></name>
<name><surname>Kernytsky</surname> <given-names>A.</given-names></name>
<etal/>
</person-group>. (<year>2010</year>). 
<article-title>The Genome Analysis Toolkit: a MapReduce framework for analyzing next-generation DNA sequencing data</article-title>. <source>Genome Res.</source> <volume>20</volume>, <fpage>1297</fpage>&#x2013;<lpage>1303</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.107524.110</pub-id>, PMID: <pub-id pub-id-type="pmid">20644199</pub-id>
</mixed-citation>
</ref>
<ref id="B51">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Merrick</surname> <given-names>L. F.</given-names></name>
<name><surname>Burke</surname> <given-names>A. B.</given-names></name>
<name><surname>Zhang</surname> <given-names>Z.</given-names></name>
<name><surname>Carter</surname> <given-names>A. H.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Comparison of single-trait and multi-trait genome-wide association models and inclusion of correlated traits in the dissection of the genetic architecture of a complex trait in a breeding program</article-title>. <source>Front. Plant Sci.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2021.772907</pub-id>, PMID: <pub-id pub-id-type="pmid">35154175</pub-id>
</mixed-citation>
</ref>
<ref id="B52">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Michaud</surname> <given-names>M.</given-names></name>
<name><surname>Prinz</surname> <given-names>W. A.</given-names></name>
<name><surname>Jouhet</surname> <given-names>J.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>Glycerolipid synthesis and lipid trafficking in plant mitochondria</article-title>. <source>FEBS J.</source> <volume>284</volume>, <fpage>376</fpage>&#x2013;<lpage>390</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/febs.13812</pub-id>, PMID: <pub-id pub-id-type="pmid">27406373</pub-id>
</mixed-citation>
</ref>
<ref id="B53">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Miura</surname> <given-names>K.</given-names></name>
<name><surname>Lee</surname> <given-names>J.</given-names></name>
<name><surname>Jin</surname> <given-names>J. B.</given-names></name>
<name><surname>Yoo</surname> <given-names>C. Y.</given-names></name>
<name><surname>Miura</surname> <given-names>T.</given-names></name>
<name><surname>Hasegawa</surname> <given-names>P. M.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>Sumoylation of ABI5 by the <italic>Arabidopsis</italic> SUMO E3 ligase SIZ1 negatively regulates abscisic acid signaling</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>106</volume>, <fpage>5418</fpage>&#x2013;<lpage>5423</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0811088106</pub-id>, PMID: <pub-id pub-id-type="pmid">19276109</pub-id>
</mixed-citation>
</ref>
<ref id="B54">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mo</surname> <given-names>W.</given-names></name>
<name><surname>Wang</surname> <given-names>P.</given-names></name>
<name><surname>Shi</surname> <given-names>Q.</given-names></name>
<name><surname>Zhao</surname> <given-names>X.</given-names></name>
<name><surname>Zheng</surname> <given-names>X.</given-names></name>
<name><surname>Ji</surname> <given-names>L.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Uncovering key genes associated with protein and oil in soybeans based on transcriptomics and proteomics</article-title>. <source>Ind. Crops Products</source> <volume>222</volume>, <elocation-id>119981</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.indcrop.2024.119981</pub-id>
</mixed-citation>
</ref>
<ref id="B55">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Moore Ronald</surname> <given-names>E. R.</given-names></name>
<name><surname>Wyman</surname> <given-names>C.</given-names></name>
<name><surname>Cunicelli</surname> <given-names>M. J.</given-names></name>
<name><surname>Olukolu</surname> <given-names>B.</given-names></name>
<name><surname>Sams</surname> <given-names>C. E.</given-names></name>
<name><surname>West</surname> <given-names>D. R.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Quantitative trait loci governing seed protein, oil, and linolenic acid concentration in soybean</article-title>. <source>J. Am. Oil Chemists&#x2019; Soc.</source> <volume>102</volume>, <fpage>137</fpage>&#x2013;<lpage>150</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/aocs.12876</pub-id>
</mixed-citation>
</ref>
<ref id="B56">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mukherjee</surname> <given-names>T.</given-names></name>
<name><surname>Tully</surname> <given-names>T. L. A.</given-names></name>
<name><surname>Allen</surname> <given-names>D. K.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>GmMFT: a potential step forward in soybean breeding for high oil and yield</article-title>. <source>New Phytol.</source> <volume>239</volume>, <fpage>815</fpage>&#x2013;<lpage>817</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/nph.18950</pub-id>, PMID: <pub-id pub-id-type="pmid">37227027</pub-id>
</mixed-citation>
</ref>
<ref id="B57">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Murray</surname> <given-names>M. G.</given-names></name>
<name><surname>Thompson</surname> <given-names>W. F.</given-names></name>
</person-group> (<year>1980</year>). 
<article-title>Rapid isolation of high molecular weight plant DNA</article-title>. <source>Nucleic Acids Res.</source> <volume>8</volume>, <fpage>4321</fpage>&#x2013;<lpage>4326</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/8.19.4321</pub-id>, PMID: <pub-id pub-id-type="pmid">7433111</pub-id>
</mixed-citation>
</ref>
<ref id="B58">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Nair</surname> <given-names>S. K.</given-names></name>
<name><surname>Rabbani</surname> <given-names>M. T.</given-names></name>
</person-group> (<year>2024</year>). &#x201c;
<article-title>Marker-assisted selection approaches for improving quality traits</article-title>,&#x201d; in <source>Smart Breeding</source> (<publisher-loc>New York</publisher-loc>: 
<publisher-name>Apple Academic Press</publisher-name>), <fpage>287</fpage>&#x2013;<lpage>328</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1201/9781003361862</pub-id>
</mixed-citation>
</ref>
<ref id="B59">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Odell</surname> <given-names>S. G.</given-names></name>
<name><surname>Hudson</surname> <given-names>A. I.</given-names></name>
<name><surname>Praud</surname> <given-names>S.</given-names></name>
<name><surname>Dubreuil</surname> <given-names>P.</given-names></name>
<name><surname>Tixier</surname> <given-names>M.-H.</given-names></name>
<name><surname>Ross-Ibarra</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Modeling allelic diversity of multiparent mapping populations affects detection of quantitative trait loci</article-title>. <source>G3 Genes|Genomes|Genetics</source> <volume>12</volume>(<issue>3</issue>), <elocation-id>jkac011</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/g3journal/jkac011</pub-id>, PMID: <pub-id pub-id-type="pmid">35100382</pub-id>
</mixed-citation>
</ref>
<ref id="B60">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Patel</surname> <given-names>J.</given-names></name>
<name><surname>Patel</surname> <given-names>S.</given-names></name>
<name><surname>Cook</surname> <given-names>L.</given-names></name>
<name><surname>Fallen</surname> <given-names>B. D.</given-names></name>
<name><surname>Koebernick</surname> <given-names>J.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>Soybean genome&#x2212;wide association study of seed weight, protein, and oil content in the southeastern USA</article-title>. <source>Mol. Genet. Genomics</source> <volume>300</volume>, <elocation-id>43</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00438-025-02228-8</pub-id>, PMID: <pub-id pub-id-type="pmid">40220041</pub-id>
</mixed-citation>
</ref>
<ref id="B61">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Pathan</surname> <given-names>S. M.</given-names></name>
<name><surname>Vuong</surname> <given-names>T.</given-names></name>
<name><surname>Clark</surname> <given-names>K.</given-names></name>
<name><surname>Lee</surname> <given-names>J.-D.</given-names></name>
<name><surname>Shannon</surname> <given-names>J. G.</given-names></name>
<name><surname>Roberts</surname> <given-names>C. A.</given-names></name>
<etal/>
</person-group>. (<year>2013</year>). 
<article-title>Genetic mapping and confirmation of quantitative trait loci for seed protein and oil contents and seed weight in soybean</article-title>. <source>Crop Sci.</source> <volume>53</volume>, <fpage>765</fpage>&#x2013;<lpage>774</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2135/cropsci2012.03.0153</pub-id>
</mixed-citation>
</ref>
<ref id="B62">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Patil</surname> <given-names>G.</given-names></name>
<name><surname>Do</surname> <given-names>T.</given-names></name>
<name><surname>Vuong</surname> <given-names>T. D.</given-names></name>
<name><surname>Valliyodan</surname> <given-names>B.</given-names></name>
<name><surname>Lee</surname> <given-names>J.-D.</given-names></name>
<name><surname>Chaudhary</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2016</year>). 
<article-title>Genomic-assisted haplotype analysis and the development of high-throughput SNP markers for salinity tolerance in soybean</article-title>. <source>Sci. Rep.</source> <volume>6</volume>, <elocation-id>19199</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/srep19199</pub-id>, PMID: <pub-id pub-id-type="pmid">26781337</pub-id>
</mixed-citation>
</ref>
<ref id="B63">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Patil</surname> <given-names>G.</given-names></name>
<name><surname>Vuong</surname> <given-names>T. D.</given-names></name>
<name><surname>Kale</surname> <given-names>S.</given-names></name>
<name><surname>Valliyodan</surname> <given-names>B.</given-names></name>
<name><surname>Deshmukh</surname> <given-names>R.</given-names></name>
<name><surname>Zhu</surname> <given-names>C.</given-names></name>
<etal/>
</person-group>. (<year>2018</year>). 
<article-title>Dissecting genomic hotspots underlying seed protein, oil, and sucrose content in an interspecific mapping population of soybean using high-density linkage mapping</article-title>. <source>Plant Biotechnol. J.</source> <volume>16</volume>, <fpage>1939</fpage>&#x2013;<lpage>1953</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pbi.12929</pub-id>, PMID: <pub-id pub-id-type="pmid">29618164</pub-id>
</mixed-citation>
</ref>
<ref id="B64">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Qi</surname> <given-names>Z.</given-names></name>
<name><surname>Han</surname> <given-names>X.</given-names></name>
<name><surname>Sun</surname> <given-names>Y.</given-names></name>
<name><surname>Wu</surname> <given-names>Q.</given-names></name>
<name><surname>Shan</surname> <given-names>D.</given-names></name>
<name><surname>Du</surname> <given-names>X.</given-names></name>
<etal/>
</person-group>. (<year>2011</year>). 
<article-title>An integrated quantitative trait locus map of oil content in soybean, <italic>Glycine max</italic> (L.) Merr., generated using a meta-analysis method for mining genes</article-title>. <source>Agric. Sci. China</source> <volume>10</volume>, <fpage>1681</fpage>&#x2013;<lpage>1692</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S1671-2927(11)60166-1</pub-id>
</mixed-citation>
</ref>
<ref id="B65">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Qin</surname> <given-names>C.</given-names></name>
<name><surname>Li</surname> <given-names>Y.-h.</given-names></name>
<name><surname>Li</surname> <given-names>D.</given-names></name>
<name><surname>Zhang</surname> <given-names>X.</given-names></name>
<name><surname>Kong</surname> <given-names>L.</given-names></name>
<name><surname>Zhou</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title><italic>PH13</italic> improves soybean shade traits and enhances yield for high-density planting at high latitudes</article-title>. <source>Nat. Commun.</source> <volume>14</volume>, <fpage>6813</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-023-42608-5</pub-id>, PMID: <pub-id pub-id-type="pmid">37884530</pub-id>
</mixed-citation>
</ref>
<ref id="B66">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rabby</surname> <given-names>M. G.</given-names></name>
<name><surname>Hossen</surname> <given-names>M. M.</given-names></name>
<name><surname>Kamal</surname> <given-names>M. M.</given-names></name>
<name><surname>Islam</surname> <given-names>M. N.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Genome-wide identification and functional analysis of lysine histidine transporter (LHT) gene families in maize</article-title>. <source>Genet. Res.</source> <volume>2022</volume>, <elocation-id>2673748</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2022/2673748</pub-id>, PMID: <pub-id pub-id-type="pmid">35528221</pub-id>
</mixed-citation>
</ref>
<ref id="B67">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ramel</surname> <given-names>F.</given-names></name>
<name><surname>Sulmon</surname> <given-names>C.</given-names></name>
<name><surname>Cabello-Hurtado</surname> <given-names>F.</given-names></name>
<name><surname>Taconnat</surname> <given-names>L.</given-names></name>
<name><surname>Martin-Magniette</surname> <given-names>M.-L.</given-names></name>
<name><surname>Renou</surname> <given-names>J.-P.</given-names></name>
<etal/>
</person-group>. (<year>2007</year>). 
<article-title>Genome-wide interacting effects of sucrose and herbicide-mediated stress in <italic>Arabidopsis thaliana</italic>: novel insights into atrazine toxicity and sucrose-induced tolerance</article-title>. <source>BMC Genomics</source> <volume>8</volume>, <elocation-id>450</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2164-8-450</pub-id>, PMID: <pub-id pub-id-type="pmid">18053238</pub-id>
</mixed-citation>
</ref>
<ref id="B68">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rotundo</surname> <given-names>J. L.</given-names></name>
<name><surname>Miller-Garvin</surname> <given-names>J. E.</given-names></name>
<name><surname>Naeve</surname> <given-names>S. L.</given-names></name>
</person-group> (<year>2016</year>). 
<article-title>Regional and temporal variation in soybean seed protein and oil across the United States</article-title>. <source>Crop Sci.</source> <volume>56</volume>, <fpage>797</fpage>&#x2013;<lpage>808</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2135/cropsci2015.06.0394</pub-id>
</mixed-citation>
</ref>
<ref id="B69">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shao</surname> <given-names>Z.</given-names></name>
<name><surname>Shao</surname> <given-names>J.</given-names></name>
<name><surname>Huo</surname> <given-names>X.</given-names></name>
<name><surname>Li</surname> <given-names>W.</given-names></name>
<name><surname>Kong</surname> <given-names>Y.</given-names></name>
<name><surname>Du</surname> <given-names>H.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Identification of closely associated SNPs and candidate genes with seed size and shape via deep re-sequencing GWAS in soybean</article-title>. <source>Theor. Appl. Genet.</source> <volume>135</volume>, <fpage>2341</fpage>&#x2013;<lpage>2351</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00122-022-04116-w</pub-id>, PMID: <pub-id pub-id-type="pmid">35588015</pub-id>
</mixed-citation>
</ref>
<ref id="B70">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sinha</surname> <given-names>P.</given-names></name>
<name><surname>Singh</surname> <given-names>V. K.</given-names></name>
<name><surname>Saxena</surname> <given-names>R. K.</given-names></name>
<name><surname>Khan</surname> <given-names>A. W.</given-names></name>
<name><surname>Abbai</surname> <given-names>R.</given-names></name>
<name><surname>Chitikineni</surname> <given-names>A.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>Superior haplotypes for haplotype-based breeding for drought tolerance in pigeonpea (<italic>Cajanus cajan</italic> L.)</article-title>. <source>Plant Biotechnol. J.</source> <volume>18</volume>, <fpage>2482</fpage>&#x2013;<lpage>2490</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pbi.13422</pub-id>, PMID: <pub-id pub-id-type="pmid">32455481</pub-id>
</mixed-citation>
</ref>
<ref id="B71">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Song</surname> <given-names>M.</given-names></name>
<name><surname>Linghu</surname> <given-names>B.</given-names></name>
<name><surname>Huang</surname> <given-names>S.</given-names></name>
<name><surname>Li</surname> <given-names>F.</given-names></name>
<name><surname>An</surname> <given-names>R.</given-names></name>
<name><surname>Xie</surname> <given-names>C.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Genome-wide survey of leucine-rich repeat receptor-like protein kinase genes and CRISPR/Cas9-targeted mutagenesis <italic>BnBRI1</italic> in <italic>Brassica napus</italic></article-title>. <source>Front. Plant Sci.</source> <volume>13</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.865132</pub-id>, PMID: <pub-id pub-id-type="pmid">35498707</pub-id>
</mixed-citation>
</ref>
<ref id="B72">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Song</surname> <given-names>W.</given-names></name>
<name><surname>Sun</surname> <given-names>S.</given-names></name>
<name><surname>Wu</surname> <given-names>T.</given-names></name>
<name><surname>Yang</surname> <given-names>R.</given-names></name>
<name><surname>Tian</surname> <given-names>S.</given-names></name>
<name><surname>Xu</surname> <given-names>C.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Geographic distributions and the regionalization of soybean seed compositions across China</article-title>. <source>Food Res. Int.</source> <volume>164</volume>, <elocation-id>112364</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.foodres.2022.112364</pub-id>, PMID: <pub-id pub-id-type="pmid">36737952</pub-id>
</mixed-citation>
</ref>
<ref id="B73">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Stone</surname> <given-names>S. L.</given-names></name>
<name><surname>Anderson</surname> <given-names>E. M.</given-names></name>
<name><surname>Mullen</surname> <given-names>R. T.</given-names></name>
<name><surname>Goring</surname> <given-names>D. R.</given-names></name>
</person-group> (<year>2003</year>). 
<article-title>ARC1 Is an E3 ubiquitin ligase and promotes the ubiquitination of proteins during the rejection of self-incompatible Brassica pollen</article-title>. <source>Plant Cell</source> <volume>15</volume>, <fpage>885</fpage>&#x2013;<lpage>898</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1105/tpc.009845</pub-id>, PMID: <pub-id pub-id-type="pmid">12671085</pub-id>
</mixed-citation>
</ref>
<ref id="B74">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Tian</surname> <given-names>T.</given-names></name>
<name><surname>Liu</surname> <given-names>Y.</given-names></name>
<name><surname>Yan</surname> <given-names>H.</given-names></name>
<name><surname>You</surname> <given-names>Q.</given-names></name>
<name><surname>Yi</surname> <given-names>X.</given-names></name>
<name><surname>Du</surname> <given-names>Z.</given-names></name>
<etal/>
</person-group>. (<year>2017</year>). 
<article-title>agriGO v2.0: a GO analysis toolkit for the agricultural community 2017 update</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume>, <fpage>W122</fpage>&#x2013;<lpage>W129</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkx382</pub-id>, PMID: <pub-id pub-id-type="pmid">28472432</pub-id>
</mixed-citation>
</ref>
<ref id="B75">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Tsao</surname> <given-names>H. E.</given-names></name>
<name><surname>Lui</surname> <given-names>S. N.</given-names></name>
<name><surname>Lo</surname> <given-names>A. H. F.</given-names></name>
<name><surname>Chen</surname> <given-names>S.</given-names></name>
<name><surname>Wong</surname> <given-names>H. Y.</given-names></name>
<name><surname>Wong</surname> <given-names>C. K.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Structural insights into how vacuolar sorting receptors recognize the sorting determinants of seed storage proteins</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>119</volume>, <fpage>e2111281119</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.2111281119</pub-id>, PMID: <pub-id pub-id-type="pmid">34983843</pub-id>
</mixed-citation>
</ref>
<ref id="B76">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Van</surname> <given-names>K.</given-names></name>
<name><surname>Lee</surname> <given-names>S.</given-names></name>
<name><surname>Mian</surname> <given-names>M. A. R.</given-names></name>
<name><surname>McHale</surname> <given-names>L. K.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>Network analysis combined with genome-wide association study helps identification of genes related to amino acid contents in soybean</article-title>. <source>BMC Genomics</source> <volume>26</volume>, <fpage>21</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12864-024-11163-8</pub-id>, PMID: <pub-id pub-id-type="pmid">39780068</pub-id>
</mixed-citation>
</ref>
<ref id="B77">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Voorrips</surname> <given-names>R. E.</given-names></name>
<name><surname>Tumino</surname> <given-names>G.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>PolyHaplotyper: haplotyping in polyploids based on bi-allelic marker dosage data</article-title>. <source>BMC Bioinf.</source> <volume>23</volume>, <fpage>442</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12859-022-04989-0</pub-id>, PMID: <pub-id pub-id-type="pmid">36274121</pub-id>
</mixed-citation>
</ref>
<ref id="B78">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>X.</given-names></name>
<name><surname>Jiang</surname> <given-names>G.</given-names></name>
<name><surname>Green</surname> <given-names>M.</given-names></name>
<name><surname>Scott</surname> <given-names>R. A.</given-names></name>
<name><surname>Song</surname> <given-names>Q.</given-names></name>
<name><surname>Hyten</surname> <given-names>D. L.</given-names></name>
<etal/>
</person-group>. (<year>2014</year>). 
<article-title>Identification and validation of quantitative trait loci for seed yield, oil and protein contents in two recombinant inbred line populations of soybean</article-title>. <source>Mol. Genet. Genomics</source> <volume>289</volume>, <fpage>935</fpage>&#x2013;<lpage>949</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00438-014-0865-x</pub-id>, PMID: <pub-id pub-id-type="pmid">24861102</pub-id>
</mixed-citation>
</ref>
<ref id="B79">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>S.</given-names></name>
<name><surname>Liu</surname> <given-names>S.</given-names></name>
<name><surname>Wang</surname> <given-names>J.</given-names></name>
<name><surname>Yokosho</surname> <given-names>K.</given-names></name>
<name><surname>Zhou</surname> <given-names>B.</given-names></name>
<name><surname>Yu</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>Simultaneous changes in seed size, oil content and protein content driven by selection of <italic>SWEET</italic> homologues during soybean domestication</article-title>. <source>Natl. Sci. Rev.</source> <volume>7</volume>, <fpage>1776</fpage>&#x2013;<lpage>1786</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nsr/nwaa110</pub-id>, PMID: <pub-id pub-id-type="pmid">34691511</pub-id>
</mixed-citation>
</ref>
<ref id="B80">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>M.</given-names></name>
<name><surname>Yan</surname> <given-names>J.</given-names></name>
<name><surname>Zhao</surname> <given-names>J.</given-names></name>
<name><surname>Song</surname> <given-names>W.</given-names></name>
<name><surname>Zhang</surname> <given-names>X.</given-names></name>
<name><surname>Xiao</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2012</year>). 
<article-title>Genome-wide association study (GWAS) of resistance to head smut in maize</article-title>. <source>Plant Sci.</source> <volume>196</volume>, <fpage>125</fpage>&#x2013;<lpage>131</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.plantsci.2012.08.004</pub-id>, PMID: <pub-id pub-id-type="pmid">23017907</pub-id>
</mixed-citation>
</ref>
<ref id="B81">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>J.</given-names></name>
<name><surname>Zhang</surname> <given-names>Z.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>GAPIT version 3: boosting power and accuracy for genomic association and prediction</article-title>. <source>Genomics Proteomics Bioinf.</source> <volume>19</volume>, <fpage>629</fpage>&#x2013;<lpage>640</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.gpb.2021.08.005</pub-id>, PMID: <pub-id pub-id-type="pmid">34492338</pub-id>
</mixed-citation>
</ref>
<ref id="B82">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>X.</given-names></name>
<name><surname>Zhang</surname> <given-names>M.</given-names></name>
<name><surname>Li</surname> <given-names>F.</given-names></name>
<name><surname>Liu</surname> <given-names>X.</given-names></name>
<name><surname>Zhang</surname> <given-names>C.</given-names></name>
<name><surname>Zhang</surname> <given-names>F.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Genome-wide association study reveals key genetic loci controlling oil content in soybean seeds</article-title>. <source>Agronomy</source> <volume>15</volume>, <fpage>1889</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/agronomy15081889</pub-id>
</mixed-citation>
</ref>
<ref id="B83">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wei</surname> <given-names>Z.</given-names></name>
<name><surname>Pan</surname> <given-names>T.</given-names></name>
<name><surname>Zhao</surname> <given-names>Y.</given-names></name>
<name><surname>Su</surname> <given-names>B.</given-names></name>
<name><surname>Ren</surname> <given-names>Y.</given-names></name>
<name><surname>Qiu</surname> <given-names>L.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>The small GTPase Rab5a and its guanine nucleotide exchange factors are involved in post-Golgi trafficking of storage proteins in developing soybean cotyledon</article-title>. <source>J. Exp. Bot.</source> <volume>71</volume>, <fpage>808</fpage>&#x2013;<lpage>822</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/jxb/erz454</pub-id>, PMID: <pub-id pub-id-type="pmid">31624827</pub-id>
</mixed-citation>
</ref>
<ref id="B84">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yan</surname> <given-names>Y.</given-names></name>
<name><surname>Li</surname> <given-names>C.</given-names></name>
<name><surname>Dong</surname> <given-names>X.</given-names></name>
<name><surname>Li</surname> <given-names>H.</given-names></name>
<name><surname>Zhang</surname> <given-names>D.</given-names></name>
<name><surname>Zhou</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>MYB30 is a key negative regulator of Arabidopsis photomorphogenic development that promotes PIF4 and PIF5 protein accumulation in the light</article-title>. <source>Plant Cell</source> <volume>32</volume>, <fpage>2196</fpage>&#x2013;<lpage>2215</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1105/tpc.19.00645</pub-id>, PMID: <pub-id pub-id-type="pmid">32371543</pub-id>
</mixed-citation>
</ref>
<ref id="B85">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yang</surname> <given-names>X.</given-names></name>
<name><surname>Liu</surname> <given-names>X.</given-names></name>
<name><surname>Zhou</surname> <given-names>Y.</given-names></name>
<name><surname>Zhang</surname> <given-names>F.</given-names></name>
<name><surname>Huang</surname> <given-names>L.</given-names></name>
<name><surname>Wang</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2021</year>). 
<article-title>New insights on the function of plant acyl carrier proteins from comparative and evolutionary analysis</article-title>. <source>Genomics</source> <volume>113</volume>, <fpage>1155</fpage>&#x2013;<lpage>1165</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ygeno.2020.11.015</pub-id>, PMID: <pub-id pub-id-type="pmid">33221517</pub-id>
</mixed-citation>
</ref>
<ref id="B86">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yang</surname> <given-names>Z.</given-names></name>
<name><surname>Luo</surname> <given-names>C.</given-names></name>
<name><surname>Pei</surname> <given-names>X.</given-names></name>
<name><surname>Wang</surname> <given-names>S.</given-names></name>
<name><surname>Huang</surname> <given-names>Y.</given-names></name>
<name><surname>Li</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>SoyMD: a platform combining multi-omics data with various tools for soybean research and breeding</article-title>. <source>Nucleic Acids Res.</source> <volume>52</volume>, <fpage>D1639</fpage>&#x2013;<lpage>D1650</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkad786</pub-id>, PMID: <pub-id pub-id-type="pmid">37811889</pub-id>
</mixed-citation>
</ref>
<ref id="B87">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yao</surname> <given-names>Y.</given-names></name>
<name><surname>You</surname> <given-names>Q.</given-names></name>
<name><surname>Duan</surname> <given-names>G.</given-names></name>
<name><surname>Ren</surname> <given-names>J.</given-names></name>
<name><surname>Chu</surname> <given-names>S.</given-names></name>
<name><surname>Zhao</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>Quantitative trait loci analysis of seed oil content and composition of wild and cultivated soybean</article-title>. <source>BMC Plant Biol.</source> <volume>20</volume>, <fpage>51</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12870-019-2199-7</pub-id>, PMID: <pub-id pub-id-type="pmid">32005156</pub-id>
</mixed-citation>
</ref>
<ref id="B88">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yu</surname> <given-names>H.</given-names></name>
<name><surname>Bhat</surname> <given-names>J. A.</given-names></name>
<name><surname>Li</surname> <given-names>C.</given-names></name>
<name><surname>Zhao</surname> <given-names>B.</given-names></name>
<name><surname>Bu</surname> <given-names>M.</given-names></name>
<name><surname>Zhang</surname> <given-names>Z.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Identification of superior and rare haplotypes to optimize branch number in soybean</article-title>. <source>Theor. Appl. Genet.</source> <volume>137</volume>, <fpage>93</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00122-024-04596-y</pub-id>, PMID: <pub-id pub-id-type="pmid">38570354</pub-id>
</mixed-citation>
</ref>
<ref id="B89">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Yuan</surname> <given-names>X.</given-names></name>
<name><surname>Jiang</surname> <given-names>X.</given-names></name>
<name><surname>Zhang</surname> <given-names>M.</given-names></name>
<name><surname>Wang</surname> <given-names>L.</given-names></name>
<name><surname>Jiao</surname> <given-names>W.</given-names></name>
<name><surname>Chen</surname> <given-names>H.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Integrative omics analysis elucidates the genetic basis underlying seed weight and oil content in soybean</article-title>. <source>Plant Cell</source> <volume>36</volume>, <fpage>2160</fpage>&#x2013;<lpage>2175</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/plcell/koae062</pub-id>, PMID: <pub-id pub-id-type="pmid">38412459</pub-id>
</mixed-citation>
</ref>
<ref id="B90">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zelaya Arce</surname> <given-names>M. S.</given-names></name>
<name><surname>Lago Tagliapietra</surname> <given-names>E. L.</given-names></name>
<name><surname>Minussi Winck</surname> <given-names>J. E.</given-names></name>
<name><surname>Ferigolo Alves</surname> <given-names>A.</given-names></name>
<name><surname>Schmidt Dalla Porta</surname> <given-names>F.</given-names></name>
<name><surname>Broilo Facco</surname> <given-names>T.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Assessing genetics, biophysical, and management factors related to soybean seed protein variation in Brazil</article-title>. <source>Eur. J. Agron.</source> <volume>165</volume>, <elocation-id>127541</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eja.2025.127541</pub-id>
</mixed-citation>
</ref>
<ref id="B91">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zeng</surname> <given-names>Y.</given-names></name>
<name><surname>Liang</surname> <given-names>Z.</given-names></name>
<name><surname>Liu</surname> <given-names>Z.</given-names></name>
<name><surname>Li</surname> <given-names>B.</given-names></name>
<name><surname>Cui</surname> <given-names>Y.</given-names></name>
<name><surname>Gao</surname> <given-names>C.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Recent advances in plant endomembrane research and new microscopical techniques</article-title>. <source>New Phytol.</source> <volume>240</volume>, <fpage>41</fpage>&#x2013;<lpage>60</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/nph.19134</pub-id>, PMID: <pub-id pub-id-type="pmid">37507353</pub-id>
</mixed-citation>
</ref>
<ref id="B92">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>C.</given-names></name>
<name><surname>Dong</surname> <given-names>S.</given-names></name>
<name><surname>Xu</surname> <given-names>J.</given-names></name>
<name><surname>He</surname> <given-names>W.</given-names></name>
<name><surname>Yang</surname> <given-names>T.</given-names></name>
</person-group> (<year>2018</year>a). 
<article-title>PopLDdecay: a fast and effective tool for linkage disequilibrium decay analysis based on variant call format files</article-title>. <source>Bioinformatics</source> <volume>35</volume>, <fpage>1786</fpage>&#x2013;<lpage>1788</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bty875</pub-id>, PMID: <pub-id pub-id-type="pmid">30321304</pub-id>
</mixed-citation>
</ref>
<ref id="B93">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>M.</given-names></name>
<name><surname>Song</surname> <given-names>H.</given-names></name>
<name><surname>Deng</surname> <given-names>X.</given-names></name>
<name><surname>Yang</surname> <given-names>M.</given-names></name>
</person-group> (<year>2024</year>a). 
<article-title>Genome-wide identification of CYP90 family and functional analysis of <italic>NnCYP90B1</italic> on rhizome enlargement in lotus</article-title>. <source>Vegetable Res.</source> <volume>4</volume>, <fpage>e035</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.48130/vegres-0024-0033</pub-id>
</mixed-citation>
</ref>
<ref id="B94">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>D.</given-names></name>
<name><surname>Sun</surname> <given-names>X.</given-names></name>
<name><surname>Hu</surname> <given-names>B.</given-names></name>
<name><surname>Li</surname> <given-names>W.-X.</given-names></name>
<name><surname>Ning</surname> <given-names>H.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>QTN mapping, gene prediction and molecular design breeding of seed protein content in soybean</article-title>. <source>Crop J.</source> <volume>13</volume>, <fpage>1116</fpage>&#x2013;<lpage>1126</lpage>.  doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cj.2025.06.011</pub-id>
</mixed-citation>
</ref>
<ref id="B95">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>J.</given-names></name>
<name><surname>Wang</surname> <given-names>X.</given-names></name>
<name><surname>Lu</surname> <given-names>Y.</given-names></name>
<name><surname>Bhusal</surname> <given-names>S. J.</given-names></name>
<name><surname>Song</surname> <given-names>Q.</given-names></name>
<name><surname>Cregan</surname> <given-names>P. B.</given-names></name>
<etal/>
</person-group>. (<year>2018</year>b). 
<article-title>Genome-wide scan for seed composition provides insights into soybean quality improvement and the impacts of domestication and breeding</article-title>. <source>Mol. Plant</source> <volume>11</volume>, <fpage>460</fpage>&#x2013;<lpage>472</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.molp.2017.12.016</pub-id>, PMID: <pub-id pub-id-type="pmid">29305230</pub-id>
</mixed-citation>
</ref>
<ref id="B96">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>Y.</given-names></name>
<name><surname>Yang</surname> <given-names>X.</given-names></name>
<name><surname>Bhat</surname> <given-names>J. A.</given-names></name>
<name><surname>Zhang</surname> <given-names>Y.</given-names></name>
<name><surname>Bu</surname> <given-names>M.</given-names></name>
<name><surname>Zhao</surname> <given-names>B.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>b). 
<article-title>Identification of superior haplotypes and candidate gene for seed size-related traits in soybean (<italic>Glycine max</italic> L.)</article-title>. <source>Mol. Breed.</source> <volume>45</volume>, <elocation-id>3</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11032-024-01525-1</pub-id>, PMID: <pub-id pub-id-type="pmid">39717350</pub-id>
</mixed-citation>
</ref>
<ref id="B97">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>D.</given-names></name>
<name><surname>Zhang</surname> <given-names>H.</given-names></name>
<name><surname>Hu</surname> <given-names>Z.</given-names></name>
<name><surname>Chu</surname> <given-names>S.</given-names></name>
<name><surname>Yu</surname> <given-names>K.</given-names></name>
<name><surname>Lv</surname> <given-names>L.</given-names></name>
<etal/>
</person-group>. (<year>2019</year>). 
<article-title>Artificial selection on <italic>GmOLEO1</italic> contributes to the increase in seed oil during soybean domestication</article-title>. <source>PloS Genet.</source> <volume>15</volume>, <fpage>e1008267</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pgen.1008267</pub-id>, PMID: <pub-id pub-id-type="pmid">31291251</pub-id>
</mixed-citation>
</ref>
<ref id="B98">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhao</surname> <given-names>X.</given-names></name>
<name><surname>Zhang</surname> <given-names>Y.</given-names></name>
<name><surname>Wang</surname> <given-names>J.</given-names></name>
<name><surname>Zhao</surname> <given-names>X.</given-names></name>
<name><surname>Li</surname> <given-names>Y.</given-names></name>
<name><surname>Teng</surname> <given-names>W.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>GWAS and WGCNA analysis uncover candidate genes associated with oil content in soybean</article-title>. <source>Plants</source> <volume>13</volume>, <fpage>1351</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/plants13101351</pub-id>, PMID: <pub-id pub-id-type="pmid">38794422</pub-id>
</mixed-citation>
</ref>
<ref id="B99">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zheng</surname> <given-names>H.</given-names></name>
<name><surname>Feng</surname> <given-names>X.</given-names></name>
<name><surname>Wang</surname> <given-names>L.</given-names></name>
<name><surname>Shao</surname> <given-names>W.</given-names></name>
<name><surname>Guo</surname> <given-names>S.</given-names></name>
<name><surname>Zhao</surname> <given-names>D.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>GmSop20 functions as a key coordinator of the oil-to-protein ratio in soybean seeds</article-title>. <source>Advanced Sci.</source> <volume>12</volume>(<issue>38</issue>), <fpage>e05181</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/advs.202505181</pub-id>, PMID: <pub-id pub-id-type="pmid">40679091</pub-id>
</mixed-citation>
</ref>
<ref id="B100">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhou</surname> <given-names>C.</given-names></name>
<name><surname>Wang</surname> <given-names>H.</given-names></name>
<name><surname>Zhu</surname> <given-names>X.</given-names></name>
<name><surname>Li</surname> <given-names>Y.</given-names></name>
<name><surname>Zhang</surname> <given-names>B.</given-names></name>
<name><surname>Tadege</surname> <given-names>M.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Functional genomics: from soybean to legume</article-title>. <source>Int. J. Mol. Sci.</source> <volume>26</volume>, <fpage>6323</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms26136323</pub-id>, PMID: <pub-id pub-id-type="pmid">40650105</pub-id>
</mixed-citation>
</ref>
<ref id="B101">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhukov</surname> <given-names>A.</given-names></name>
<name><surname>Popov</surname> <given-names>V.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Synthesis of C<sub>20&#x2013;38</sub> fatty acids in plant tissues</article-title>. <source>Int. J. Mol. Sci.</source> <volume>23</volume>, <fpage>4731</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms23094731</pub-id>, PMID: <pub-id pub-id-type="pmid">35563119</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/382119">Hasan Mehraj</ext-link>, The University of Tokyo, Japan</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/496329">Jianbo He</ext-link>, Nanjing Agricultural University, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1598119">Min Zhang</ext-link>, Chinese Academy of Sciences (CAS), China</p></fn>
</fn-group>
</back>
</article>