<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2022.1045953</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Identification of loci governing soybean seed protein content <italic>via</italic> genome-wide association study and selective signature analyses</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Hongmei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/700561"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Guwen</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/294925"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Wei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Qiong</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1241808"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Xu</surname>
<given-names>Wenjing</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Xiaoqing</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Cui</surname>
<given-names>Xiaoyan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/911997"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Xin</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/583958"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Chen</surname>
<given-names>Huatao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1365796"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Institute of Industrial Crops, Jiangsu Academy of Agricultural Sciences</institution>, <addr-line>Nanjing Jiangsu</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Institute of Vegetables, Zhejiang Academy of Agricultural Sciences</institution>, <addr-line>Hangzhou Zhejiang</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>College of Horticulture, Nanjing Agricultural University</institution>, <addr-line>Nanjing, Jiangsu</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Khalid Meksem, Southern Illinois University Carbondale, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Nacer Bellaloui, Agricultural Research Service (USDA), United States; Milad Eskandari, University of Guelph, Canada</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Huatao Chen, <email xlink:href="mailto:cht@jaas.ac.cn">cht@jaas.ac.cn</email>
</p>
</fn>
<fn fn-type="equal" id="fn003">
<p>&#x2020;These authors have contributed equally to this work</p>
</fn>
<fn fn-type="other" id="fn002">
<p>This article was submitted to Plant Breeding, a section of the journal Frontiers in Plant Science</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>02</day>
<month>12</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>13</volume>
<elocation-id>1045953</elocation-id>
<history>
<date date-type="received">
<day>20</day>
<month>09</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>21</day>
<month>11</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Zhang, Zhang, Zhang, Wang, Xu, Liu, Cui, Chen and Chen</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Zhang, Zhang, Zhang, Wang, Xu, Liu, Cui, Chen and Chen</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Soybean [<italic>Glycine max</italic> (L.) Merr.] is an excellent source of protein. Understanding the genetic basis of protein content (PC) will accelerate breeding efforts to increase soybean quality. In the present study, a genome-wide association study (GWAS) was applied to detect quantitative trait loci (QTL) for PC in soybean using 264 re-sequenced soybean accessions and a high-quality single nucleotide polymorphism (SNP) map. Eleven QTL were identified as associated with PC. The QTL <italic>qPC-14</italic> was detected by GWAS in both environments and was shown to have undergone strong selection during soybean improvement. Fifteen candidate genes were identified in <italic>qPC-14</italic>, and three candidate genes showed differential expression between a high-PC and a low-PC variety during the seed development stage. The QTL identified here will be of significant use in molecular breeding efforts, and the candidate genes will play essential roles in exploring the mechanisms of protein biosynthesis.</p>
</abstract>
<kwd-group>
<kwd>protein content</kwd>
<kwd>GWAS</kwd>
<kwd>Selective signature analysis</kwd>
<kwd>candidate genes</kwd>
<kwd>soybean</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Key Research and Development Program of China<named-content content-type="fundref-id">10.13039/501100012166</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">Jiangsu Agricultural Science and Technology Innovation Fund<named-content content-type="fundref-id">10.13039/100007540</named-content>
</contract-sponsor>
<contract-sponsor id="cn003">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content>
</contract-sponsor>
<contract-sponsor id="cn004">Natural Science Foundation of Jiangsu Province<named-content content-type="fundref-id">10.13039/501100004608</named-content>
</contract-sponsor>
<counts>
<fig-count count="4"/>
<table-count count="2"/>
<equation-count count="1"/>
<ref-count count="29"/>
<page-count count="8"/>
<word-count count="3822"/>
</counts>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Approximately 68% of the protein powder produced worldwide is derived from soybean [<italic>Glycine max</italic> (L.) Merr.]. Furthermore, meat producers have found soybean meal to be the preferred protein source for poultry and livestock. The demand for higher protein content (PC) over recent years has pushed breeders to develop soybean seeds with higher levels of protein (<xref ref-type="bibr" rid="B15">Patil et&#xa0;al., 2017</xref>). It is therefore important to understand the variation in soybean seed PC. Breeding high-protein soybean varieties is of great significance for increasing soybean protein yield. However, understanding of the mechanism(s) controlling variation in PC is limited.</p>
<p>In recent decades, 252 quantitative trait loci (QTL) on 20 chromosomes have been discovered for soybean PC and published in the Soybean Genetics and Genomics Database (<uri xlink:href="https://www.soybase.org/">https://www.soybase.org/</uri>). Biparental populations were used as the genetic background in the studies that uncovered 248 of those QTL. <xref ref-type="bibr" rid="B3">Diers et&#xa0;al. (1992)</xref> evaluated 60 F<sub>2:3</sub> lines (A81-356022&#xd7;PI 468916) with a restriction fragment length polymorphism (RFLP) linkage map of soybean containing 252 markers over 2,147 cM. They identified eight major QTL associated with PC in linkage groups A, C, and K, which explained 12-42% of the phenotypic variation. A major QTL for PC was detected on chromosome 14, which explained 12.4% of the phenotypic variation (<xref ref-type="bibr" rid="B25">Zhang et&#xa0;al., 2004</xref>). The resolution of QTL mapping <italic>via</italic> biparental populations was also successfully used to validate major QTL for PC (<xref ref-type="bibr" rid="B21">Wang et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B22">Warrington et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B16">Piyaporn et&#xa0;al., 2016</xref>). However, the higher confidence intervals and lower genetic variation in biparental populations cause challenges in integrating the results of linkage mapping into breeding programs; genome-wide association studies (GWAS) are thus preferred to study all recombination events that have occurred in the linkage disequilibrium (LD)-based evolutionary history of natural populations (<xref ref-type="bibr" rid="B12">Li et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B28">Zhang et&#xa0;al., 2021</xref>).</p>
<p>In association panels, characteristics such as LD, genetic diversity, marker density, and population structure affect the resolution and accuracy of QTL detected <italic>via</italic> GWAS (<xref ref-type="bibr" rid="B19">Sonah et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B27">Zhang et&#xa0;al., 2022</xref>). In recent years, GWAS have not only been applied to different populations to identify QTL associated with PC in soybean (<xref ref-type="bibr" rid="B19">Sonah et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B24">Zhang et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B12">Li et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B26">Zhang T et al., 2019</xref>), but have also been applied to analyze other complex quantitative traits such as oil content, salt stress tolerance, agronomic traits, and yield-related traits (<xref ref-type="bibr" rid="B7">Hwang et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B4">Fang et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B24">Zhang W et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B14">Pang et&#xa0;al., 2020</xref>). These findings have confirmed GWAS as a suitable approach for identifying novel QTL.</p>
<p>To identify novel components of the genetic architecture underlying PC, we here re-sequenced 264 soybean accessions and analyzed the genomes with a high-resolution single nucleotide polymorphism (SNP) map. In total, 11 QTL related to PC were identified. One QTL that was significantly associated with PC, <italic>qPC-14</italic>, was shown to have undergone selection during soybean improvement. Three candidate genes exhibiting differential expression between cultivars during the seed development stage may be involved in regulating soybean PC. The genes and SNPs identified here are expected to contribute to cultivation of high-protein soybean varieties through marker-assisted selection (MAS) programs.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="s2_1">
<title>Plant materials and phenotypic measurements</title>
<p>There were 264 accessions in the soybean population: 52 landraces and 212 improved varieties (<xref ref-type="bibr" rid="B28">Zhang et&#xa0;al., 2021</xref>). All materials were planted in Sanya City, Hainan Province (109.70&#xb0; E, 18.31&#xb0;N) in 2020 (E1), and in Nanjing City, Jiangsu Province (118.68&#xb0;E, 32.50&#xb0;N) in 2021 (E2). The experimental plots utilized a randomized complete block design in one row with three replicates. The dimensions for single row seeding were 4&#xa0;m length by 0.5&#xa0;m width with 0.13&#xa0;m spacing. Seeds from duplicate samples were pooled and dried in an oven to a constant weight.</p>
<p>For each replication, 20&#xa0;g of seeds were ground with a 1095 Knifetec sample mill (FOSS Tecator, Denmark). All grains were sieved (0.25&#xa0;mm pore size) into sample bottles. For each sample, 0.2&#xa0;g was weighed out and placed in a 300 mL disboil tube. Protein content was then determined using the Kjeldahl protein analyzer (SKD-1800) according to <xref ref-type="bibr" rid="B1">Bremner (1960)</xref>.</p>
</sec>
<sec id="s2_2">
<title>Statistical analyses of phenotypic data</title>
<p>Descriptive statistics and <italic>h</italic>
<sup>2</sup> were calculated in R (<uri xlink:href="http://www.Rproject.org/">http://www.Rproject.org/</uri>). The formula for <italic>h</italic>
<sup>2</sup> was as follows:</p>
<disp-formula>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:msubsup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>g</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>&#x2215;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msubsup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>g</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>+</mml:mo>
<mml:msubsup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>&#x2215;</mml:mo>
<mml:mi>n</mml:mi>
<mml:mo>+</mml:mo>
<mml:msup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>&#x2215;</mml:mo>
<mml:mi>n</mml:mi>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>&#x3c3;</italic>
<sup>2</sup>
<sub>g</sub> is the genotypic variance, <italic>&#x3c3;</italic>
<sup>2</sup>
<sub>ge</sub> is the genotype by environmental interaction variance, <italic>&#x3c3;</italic>
<sup>2</sup> is the error variance, <italic>n</italic> is the number of environments, and <italic>r</italic> is the number of replicates. Bar graphs and line graphs were generated in Origin v8.0.</p>
</sec>
<sec id="s2_3">
<title>Genotyping and GWAS</title>
<p>The germplasm resource population contained 264 accessions. The physical distance of the LD decay was estimated as the position at which <italic>r<sup>2</sup>
</italic> decreased to half of its maximum value (~120 kb) (<xref ref-type="bibr" rid="B28">Zhang et&#xa0;al., 2021</xref>). A total of 2,597,425 SNPs were used in the GWAS (<xref ref-type="bibr" rid="B28">Zhang et&#xa0;al., 2021</xref>). MLMs were generated using the Genomic Association and Prediction Integrated Tool (&#x2018;GAPIT&#x2019;) package in R. To reduce false positives and increase statistical accuracy (<xref ref-type="bibr" rid="B10">Lipka et&#xa0;al., 2012</xref>), -log<sub>10</sub>(<italic>p</italic>) &gt; 5 was set as the threshold for a correlation to be considered significant.</p>
</sec>
<sec id="s2_4">
<title>Selective sweep analyses</title>
<p>The VCFtools package (<xref ref-type="bibr" rid="B2">Danecek et&#xa0;al., 2011</xref>) was used to analyze the nucleotide diversity (&#x3c0;) and <italic>F<sub>ST</sub>
</italic> between landraces and cultivars using a 10 kb step size and a 100 kb sliding window. The top 5% of <italic>&#x3b8;</italic>
<sub>&#x3c0;</sub> ratios and <italic>F<sub>ST</sub>
</italic> values were classified as putative selective regions and highly differentiated regions, respectively. The window intersection areas of <italic>F<sub>ST</sub>
</italic> and <italic>&#x3b8;</italic>
<sub>&#x3c0;</sub> ratio were designated as potential selective regions. <italic>F<sub>ST</sub>
</italic>&#x2265; 0.204 and <italic>&#x3b8;</italic>
<sub>&#x3c0;</sub> ratio&lt; 0.545 were the thresholds used for landraces vs. cultivars in the selective sweep analysis.</p>
</sec>
<sec id="s2_5">
<title>RT&#x2212;PCR for candidate genes</title>
<p>Two soybean genotypes were used to examine differences in the expression of genes related to soybean PC accumulation during seed development <italic>via</italic> transcriptomics: NPS233 (high PC) and NPS301 (low PC). These two varieties exhibiting different genotypes and protein content, in which NPS233 with S14_73926-A and NPS301 with SNP S14_73926-G. Seed samples were collected from the two accessions at 14, 21, and 28 DAF, then immediately frozen in liquid nitrogen and stored at -80&#xb0;C prior to further use.</p>
<p>Total RNA was extracted using an RNAsimple Total RNA Kit (TIANGEN, China). First-strand cDNA synthesis was conducted with a TaKaRa Primer Script RT reagent kit and gDNA Eraser. RT-PCR was performed on an ABI 7500 system (Applied Biosystems, USA) using SYBR Green Real-time Master Mix (Toyobo). Tubulin (GenBank accession number: AY907703) was used as the internal control for expression normalization.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Phenotypic variation in PC</title>
<p>A total of 264 soybean accessions were used in this study. Seed PC was measured in soybeans grown in 2020 (E1) and 2021 (E1) (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). In addition, the mean value of E1 and E2, named as Combined, was used for data analysis. It was shown that differences in PC in the natural population were significant in E1,E2, and Combined (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref> and <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). The range of soybean PC in the natural populations were 34.42% to 39.89% in E1, 33.46% to 48.53% in E2, and 35.18% and 49.07%, (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1</bold>
</xref>). The average PC in the natural population in Sanya was 41.17%, which was significantly higher than that of Nanjing (38.91%), indicating that PC was easily influenced by the growth environment. PC was normally distributed in the associated populations (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>), with extensive variation in trait phenotypes (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). The 66.43% generalized heritability (<italic>H<sup>2</sup>
</italic>) for PC indicated that genetic factors played a crucial role in soybean protein accumulation.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Descriptive statistics for soybean protein content of the natural population.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">En<sup>a</sup>
</th>
<th valign="top" align="center">Min (%)</th>
<th valign="top" align="center">Max (%)</th>
<th valign="top" align="center">Range<sup>b</sup>(%)</th>
<th valign="top" align="center">Mean &#xb1; SD<sup>c</sup>
</th>
<th valign="top" align="center">CV<sup>d</sup>(%)</th>
<th valign="top" align="center">
<italic>H<sup>2 e</sup>
</italic>(%)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">E1</td>
<td valign="top" align="center">34.42</td>
<td valign="top" align="center">49.89</td>
<td valign="top" align="center">15.47</td>
<td valign="top" align="center">41.17 &#xb1; 2.42</td>
<td valign="top" align="center">5.89</td>
<td valign="top" rowspan="3" align="center">66.43</td>
</tr>
<tr>
<td valign="top" align="left">E2</td>
<td valign="top" align="center">33.46</td>
<td valign="top" align="center">48.53</td>
<td valign="top" align="center">15.07</td>
<td valign="top" align="center">38.91 &#xb1; 2.10</td>
<td valign="top" align="center">5.4</td>
</tr>
<tr>
<td valign="top" align="left">Combined</td>
<td valign="top" align="center">35.18</td>
<td valign="top" align="center">49.07</td>
<td valign="top" align="center">13.89</td>
<td valign="top" align="center">40.03 &#xb1; 1.95</td>
<td valign="top" align="center">4.87</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>a E1, Sanya in 2020; E2, Nanjing in 2021, Combined, the mean value of E1 and E2. b Range, difference between maximum and minimum value. c Mean &#xb1; SD, mean &#xb1; standard deviation. d CV, coefficient of variation. e H2, broad-sense heritability.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Distribution of soybean seed protein content (PC). Boxplot <bold>(A)</bold> and frequency distribution <bold>(B)</bold> of soybean seed PC in E1, E2, and combined environment, respectively.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-1045953-g001.tif"/>
</fig>
</sec>
<sec id="s3_2">
<title>GWAS for PC in a natural population</title>
<p>GWAS was conducted to detect SNPs associated with PC across two environments using 2,597,425 SNPs reported in a previous study (<xref ref-type="bibr" rid="B28">Zhang et&#xa0;al., 2021</xref>). To minimize false positives, a mixed linear model (MLM) was applied. The Manhattan plots for the GWAS results are shown in <xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2A&#x2013;C</bold>
</xref>. PC was observed to be significantly correlated with 159 SNPs at a threshold of -log<sub>10</sub>(<italic>p</italic>) &gt; 5 (<xref ref-type="supplementary-material" rid="SM2">
<bold>Table S2</bold>
</xref>). The SNPs were distributed across 11 chromosomes in E1, E2, and combined environment (<xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2A&#x2013;C</bold>
</xref> and <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>) and were responsible for phenotypic variation from 5.48 to 9.20% (<xref ref-type="supplementary-material" rid="SM2">
<bold>Table S2</bold>
</xref>). Among the significant SNPs, 30 were located on Chr.14; one of these, <italic>qPC-14-1</italic>, was represented by a peak at SNP S14_73926 and was detected in both 2020, 2021, and combined environment (<italic>p</italic> = 8.56&#xd7;10<sup>-7</sup>, and 1.86&#xd7;10<sup>-6</sup>, 5.93&#xd7;10<sup>-8</sup> respectively). <italic>qPC-18-1</italic>, located on Chr. 18, contained 99 SNPs; it was seen as a peak at SNP S18_53913918 and explained 9.20% of the total phenotypic variation in 2021 and combined environment. Moreover, we observed that soybean accessions carrying the S14_73926-A allele exhibited significantly higher average PC than those carrying the S14_73926-G allele (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2D</bold>
</xref>). Furthermore, soybean varieties carrying the S18_53913918-C allele showed significantly lower average PC than those carrying the S18_53913918-T allele (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2E</bold>
</xref>). In summary, GWAS yielded several loci that could explain the genetic variation responsible for differences in PC between genotypes.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>GWAS for seed protein content (PC). Manhattan plot for seed PC in E1 <bold>(A)</bold>, E2 <bold>(B)</bold>, and combined <bold>(C)</bold>. The red line indicates the significance threshold at -log<sub>10</sub>(<italic>p</italic>) = 5. <bold>(D)</bold> Boxplots for seed PC based on the S14_73926-A/G alleles in 2020 and 2021. <bold>(E)</bold> Boxplots for seed PC based on the S18_53913918-G/T alleles in 2020 and 2021. ***p &lt; 0.001.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-1045953-g002.tif"/>
</fig>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Loci and SNPs significantly associated with protein content, predicted candidate genes and previously reported QTL for protein content at similar genome regions.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">QTL</th>
<th valign="top" align="center">Env<xref ref-type="table-fn" rid="fnT2_1">
<sup>a</sup>
</xref>
</th>
<th valign="top" align="center">Chr<xref ref-type="table-fn" rid="fnT2_2">
<sup>b</sup>
</xref>
</th>
<th valign="top" align="center">Position<xref ref-type="table-fn" rid="fnT2_3">
<sup>c</sup>
</xref>
</th>
<th valign="top" align="center">Lead SNP</th>
<th valign="top" align="center">&#x2212;log<sub>10</sub>(<italic>p</italic>)</th>
<th valign="top" align="center">
<italic>R</italic>
<sup>2</sup>(%)<xref ref-type="table-fn" rid="fnT2_4">
<sup>d</sup>
</xref>
</th>
<th valign="top" align="center">Known QTL</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">
<italic>qPC-3</italic>
</td>
<td valign="top" align="left">E2</td>
<td valign="top" align="left">Gm3</td>
<td valign="top" align="center">5232779</td>
<td valign="top" align="center">S03_5232779</td>
<td valign="top" align="center">5.70</td>
<td valign="top" align="center">6.38</td>
<td valign="top" align="left">Seed protein 4-9 (<xref ref-type="bibr" rid="B9">Lee et&#xa0;al., 1996</xref>);<break/>Seed protein 36-36 (<xref ref-type="bibr" rid="B13">Mao et&#xa0;al., 2013</xref>)</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>qPC-5</italic>
</td>
<td valign="top" align="left">E2</td>
<td valign="top" align="left">Gm5</td>
<td valign="top" align="center">24270611</td>
<td valign="top" align="center">S05_24270611</td>
<td valign="top" align="center">5.46</td>
<td valign="top" align="center">6.07</td>
<td valign="top" align="left">Seed protein 36-1 (<xref ref-type="bibr" rid="B13">Mao et&#xa0;al., 2013</xref>);</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>qPC-6</italic>
</td>
<td valign="top" align="left">E2</td>
<td valign="top" align="left">Gm6</td>
<td valign="top" align="center">13847565</td>
<td valign="top" align="center">S06_13847565</td>
<td valign="top" align="center">5.26</td>
<td valign="top" align="center">5.81</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>qPC-8</italic>
</td>
<td valign="top" align="left">E2</td>
<td valign="top" align="left">Gm8</td>
<td valign="top" align="center">40497729</td>
<td valign="top" align="center">S08_40497729</td>
<td valign="top" align="center">5.01</td>
<td valign="top" align="center">5.48</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>qPC-9</italic>
</td>
<td valign="top" align="left">E2</td>
<td valign="top" align="left">Gm9</td>
<td valign="top" align="center">18127054</td>
<td valign="top" align="center">S09_18127054</td>
<td valign="top" align="center">6.15</td>
<td valign="top" align="center">6.97</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>qPC-10</italic>
</td>
<td valign="top" align="left">E2</td>
<td valign="top" align="left">Gm10</td>
<td valign="top" align="center">16047138</td>
<td valign="top" align="center">S10_16047138</td>
<td valign="top" align="center">5.45</td>
<td valign="top" align="center">6.05</td>
<td valign="top" align="left">Seed protein 36-40 (<xref ref-type="bibr" rid="B13">Mao et&#xa0;al., 2013</xref>)</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>qPC-14</italic>
</td>
<td valign="top" align="left">E1,E2, combined</td>
<td valign="top" align="left">Gm14</td>
<td valign="top" align="center">73926</td>
<td valign="top" align="center">S14_73926</td>
<td valign="top" align="center">6.07</td>
<td valign="top" align="center">8.45</td>
<td valign="top" align="left">Seed protein 4-g4 (<xref ref-type="bibr" rid="B19">Sonah et&#xa0;al., 2015</xref>)</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>qPC-16-1</italic>
</td>
<td valign="top" align="left">E1</td>
<td valign="top" align="left">Gm16</td>
<td valign="top" align="center">27931926</td>
<td valign="top" align="center">S16_27931926</td>
<td valign="top" align="center">5.14</td>
<td valign="top" align="center">6.97</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>qPC-16-2</italic>
</td>
<td valign="top" align="left">E2</td>
<td valign="top" align="left">Gm16</td>
<td valign="top" align="center">6800169</td>
<td valign="top" align="center">S16_6800169</td>
<td valign="top" align="center">6.85</td>
<td valign="top" align="center">7.90</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>qPC-17</italic>
</td>
<td valign="top" align="left">E1</td>
<td valign="top" align="left">Gm17</td>
<td valign="top" align="center">1545686</td>
<td valign="top" align="center">S17_1545686</td>
<td valign="top" align="center">5.46</td>
<td valign="top" align="center">7.47</td>
<td valign="top" align="left">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">
<italic>qPC-18</italic>
</td>
<td valign="top" align="left">E1, combined</td>
<td valign="top" align="left">Gm18</td>
<td valign="top" align="center">53913918</td>
<td valign="top" align="center">S18_53913918</td>
<td valign="top" align="center">6.52</td>
<td valign="top" align="center">9.20</td>
<td valign="top" align="left">Seed protein 1-8 (<xref ref-type="bibr" rid="B3">Diers et&#xa0;al., 1992</xref>),</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="fnT2_1">
<label>a</label>
<p>Environment.</p>
</fn>
<fn id="fnT2_2">
<label>b</label>
<p>Chromosome.</p>
</fn>
<fn id="fnT2_3">
<label>c</label>
<p>Most significant SNP position.</p>
</fn>
<fn id="fnT2_4">
<label>d</label>
<p>The proportion of phenotypic variance explained by each QTL.</p>
</fn>
<fn>
<p>E1 and E2 represent two environments, 2020-year, and 2021-year, respectively.</p>
</fn>
<fn>
<p>Combined means the average value of E1 and E2.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_3">
<title>
<italic>qPC-14</italic> is an improvement-selective QTL</title>
<p>Wild soybean often has higher seed PC than landraces or improved cultivars, suggesting that seed PC has been under selection during soybean domestication and varietal improvement. Our previous study detected 39 improvement-selective regions for seed PC in a natural population containing 52 landraces and 212 cultivars (<xref ref-type="bibr" rid="B28">Zhang et&#xa0;al., 2021</xref>). In the present study, <italic>qPC-14</italic>, represented by SNP S14_73926, was located within a selective sweep region ~270 kb in size (Chr14: 0&#x2013;270,000) as inferred by the fixation index (<italic>F</italic>
<sub>ST</sub>) (&#x2265; 0.204) (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>) and <italic>&#x3b8;</italic>
<sub>&#x3c0;</sub> ratio (&lt; 0.545) (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>). The data suggested that this GWAS signal, which was significantly associated with seed PC, had undergone strong selection during soybean improvement. Interestingly, we also observed that the frequency of the S14_73926-A allele was 30.8% in landraces, significantly higher than the 3.0% frequency in cultivars (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3C</bold>
</xref>). This difference was associated with a higher average seed PC in landraces (42.61% and 40.54%) than in cultivars (40.83% and 38.51%) (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3D</bold>
</xref>). Taken together, these results indicated that we identified a critical QTL for soybean PC through GWAS in the present study.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>
<bold>(A)</bold> Nucleotide diversity (&#x3c0;) values in landraces and improved cultivars. <bold>(B)</bold> Fixation index (<italic>F</italic>
<sub>ST</sub>) plot of landraces and cultivars in the 600-kb genomic regions surrounding the lead SNP, S14_73926, in <italic>qPC-14-1.</italic> <bold>(C)</bold> Allele frequencies of S14_73926 in landraces and cultivars. A and G are the two different alleles for the SNP S14_73926. <bold>(D)</bold> Boxplot of soybean seed protein content (PC) in landraces and cultivars grown in 2020 and 2021. ***p &lt; 0.001.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-1045953-g003.tif"/>
</fig>
</sec>
<sec id="s3_4">
<title>Candidate genes for PC</title>
<p>To identify candidate genes, we studied the 120 kb region flanking a significant representative SNP (S14_73926) based on the LD decay distance reported in a previous study (<xref ref-type="bibr" rid="B28">Zhang et&#xa0;al., 2021</xref>). Fifteen candidate genes were predicted in this region (<xref ref-type="supplementary-material" rid="SM3">
<bold>Table S3</bold>
</xref>). To determine which genes affected seed PC, quantitative reverse transcription (qRT)-PCR was conducted to analyze spatiotemporal expression patterns of the 15 candidate genes during seed development. Samples were collected from two soybean lines, NPS233 (with SNP S14_73926-A, a high protein variety) and NPS301 (with SNP S14_73926-G, a low protein variety) at 14, 21, and 28&#xa0;d after flowering (DAF). The expression levels of two genes was too lowly to be detected (<italic>Glyma.14g000100</italic>, <italic>Glyma.14g000200</italic>, and <italic>Glyma.14G000900</italic>), and nine showed no significant differences in expression levels between NPS233 and NPS301 (<italic>Glyma.14G000300</italic>, <italic>Glyma.14G000400</italic>, <italic>Glyma.14G000500</italic>, <italic>Glyma.14G000700</italic>, <italic>Glyma.14G000800</italic>, <italic>Glyma.14G001100</italic>, <italic>Glyma.14G001200</italic>, <italic>Glyma.14G001300</italic>, and <italic>Glyma.14G001500</italic>). At 14 DAF, <italic>Glyma.14G000600</italic> was expressed at low levels with no significant difference between NPS233 and NPS301; however, this gene was then strongly downregulated in NPS233 compared to NPS301 (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>). Relative expression of <italic>Glyma.14G001000</italic> was significantly lower in NPS233 than in NPS301 during the seed development stage (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>). In addition, <italic>Glyma.14G001400</italic> was more highly expressed in NPS301 than in NPS233 at 14 DAF, but there was no difference in expression at 21 or 28 DAF (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>).</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Relative expression patterns of <italic>Glyma.14g000600</italic> <bold>(A)</bold>, <italic>Glyma.14g001000</italic> <bold>(B)</bold>, and <italic>Glyma.14g001400</italic> <bold>(C)</bold> during seed development in the accessions NPS233 and NPS301. Seeds were sampled at 14, 21, and 28 days after flowering (DAF). *<italic>p</italic>&lt; 0.05, **<italic>p</italic>&lt; 0.01.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-1045953-g004.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>The goal of the present study was to identify SNPs and candidate genes significantly associated with soybean PC variation. A natural soybean population was re-sequenced and planted in two different geographical locations (Sanya in 2020 and Nanjing in 2021), and the phenotypes used to conduct GWAS for PC. It has previously been reported that soybean varieties planted at high latitudes exhibit lower PC than those planted at low latitudes. In addition, soybean PC is known to be affected by environmental factors, such as day length, temperature, and moisture levels (<xref ref-type="bibr" rid="B20">Song et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B15">Patil et&#xa0;al., 2017</xref>). Here, the average PC of a natural population plated in Sanya was significantly higher than the same population planted in Nanjing (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). This suggests that combined climatic factors caused significant changes in PC and thus resulted in extensive phenotypic variation in the natural populations used for GWAS.</p>
<p>Over the past two decades, a great deal of research has been published related to genetic dissection of soybean PC. More than 200 QTL across 20 chromosomes have been identified as associated with seed PC (SoyBase, <uri xlink:href="http://www.soybase.org/">http://www.soybase.org/</uri>). A QTL related to seed PC and oil content has been located on Chr. 20 (<xref ref-type="bibr" rid="B3">Diers et&#xa0;al., 1992</xref>; <xref ref-type="bibr" rid="B7">Hwang et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B22">Warrington et&#xa0;al., 2015</xref>), and it has received extensive attention because of its high additive effects and stability (<xref ref-type="bibr" rid="B3">Diers et&#xa0;al., 1992</xref>; <xref ref-type="bibr" rid="B21">Wang et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B12">Li et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B18">Samanfar et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B23">Zhang W et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B11">Li et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B5">Goettel et&#xa0;al., 2022</xref>). <italic>Glyma.20G085100</italic> (<italic>POWR1</italic>) was recently reported as a causative gene of chr20 QTL; a transposable element insertion in its conserved CCT domain produced seeds with increased oil content and weight and decreased PC (<xref ref-type="bibr" rid="B5">Goettel et&#xa0;al., 2022</xref>). However, few QTL or genes related to PC have been applied in breeding due to limitations such as insignificant and unstable effects on phenotypes, negative correlations with seed oil and seed yield, and inconsistencies between growing environments (<xref ref-type="bibr" rid="B21">Wang et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B5">Goettel et&#xa0;al., 2022</xref>). It is therefore imperative to identify QTL with consistent and large effects on PC. In this study, to detect significant SNPs related to PC, a high-density map from a previous study (<xref ref-type="bibr" rid="B28">Zhang et&#xa0;al., 2021</xref>) was used. This map contained 2,597,425 SNPs, corresponding to ~2.6 SNP markers per kb, improving the precision of GWAS for studying complex traits. Eleven QTL for PC were detected <italic>via</italic> GWAS with an MLM method. Five were close to or overlapping with regions reported in previous studies, whereas six are reported here for the first time (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). The QTL <italic>qPC-3</italic> identified here was located within three other QTL: <italic>seed protein 4-9</italic> (<xref ref-type="bibr" rid="B9">Lee et&#xa0;al., 1996</xref>), <italic>seed protein 36-36</italic>, and <italic>seed protein 36-40</italic> (<xref ref-type="bibr" rid="B13">Mao et&#xa0;al., 2013</xref>). <italic>qPC-5</italic> and <italic>qPC-10</italic> were each located within a previously mapped QTL, <italic>seed protein 36-1</italic> and <italic>seed protein 36-40</italic>, respectively (<xref ref-type="bibr" rid="B13">Mao et&#xa0;al., 2013</xref>). Although <italic>qPC-18</italic> was found to be associated with PC in 2020 and the SNP S18_53913918 accounted for 9.20% of the phenotypic variation, it also overlapped with a previously reported QTL (<xref ref-type="bibr" rid="B3">Diers et&#xa0;al., 1992</xref>), <italic>seed protein 1-8</italic> on Chr.18. <italic>qPC-14</italic> was significantly associated with PC in both 2020 and 2021 (<xref ref-type="supplementary-material" rid="SM2">
<bold>Table S2</bold>
</xref>). A previous GWAS showed that some SNP loci in this region regulated PC (<xref ref-type="bibr" rid="B19">Sonah et&#xa0;al., 2015</xref>). These results suggested that there are genes in these regions that regulate seed PC; future work should aim to identify candidate genes in these regions.</p>
<p>In China, demand for soybean has increased rapidly, and 80% of soybeans consumed were imported from Brazil and the United States of America in recent years. This trend has caused many breeders to prioritize high seed yield in recent years. However, there is a negative correlation between seed yield and PC (<xref ref-type="bibr" rid="B17">Rotundo et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B15">Patil et&#xa0;al., 2017</xref>), which prevents simultaneous increases in seed PC and yield. The breeding objective of high yield may result in development of more improved varieties with higher seed yield and lower PC compared with landrace varieties. Indeed, we found that the average PC was much higher in landrace varieties than in cultivars (<italic>p</italic>&lt; 0.01).</p>
<p>Wild soybean is known to have much higher seed PC than landraces and cultivars (<xref ref-type="bibr" rid="B7">Hwang et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B8">Leamy et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B12">Li et&#xa0;al., 2019</xref>). This suggests that seed PC has undergone selection during domestication and improvement (<xref ref-type="bibr" rid="B5">Goettel et&#xa0;al., 2022</xref>). Domestication and improvement always resulted in selective sweeps, and significantly reduced nucleotide diversity in some regions of the genome (<xref ref-type="bibr" rid="B6">Hufford et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B29">Zhou et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B28">Zhang et&#xa0;al., 2021</xref>).Recently, a domestication gene, <italic>POWR1</italic>, was reported to regulate soybean protein content likely through controlling seed nutrient transport and lipid metabolism genes (<xref ref-type="bibr" rid="B5">Goettel et&#xa0;al., 2022</xref>). In the present study, to detect improvement-selection signals using soybean varieties collected from China, we scanned genomic regions with extreme allele frequency differences as described in our previous study (<xref ref-type="bibr" rid="B28">Zhang et&#xa0;al., 2021</xref>). An improvement-selection region was identified on Chr.14, which was overlapped with QTL <italic>qPC</italic>-<italic>14</italic> identified in this study. These results indicated that this QTL may have undergone selection during soybean improvement and was therefore a strong candidate gene for PC.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<title>Conclusions</title>
<p>Using a GWAS approach, 11 QTL were determined to be associated with PC in soybean. A reproducible and significant QTL, <italic>qPC-14</italic>, overlapped with a selective-sweep region on Chr.14, demonstrating that this QTL had undergone selection during soybean improvement. Three candidate genes showed differential expression patterns between the high PC accession NPS233 and the low PC accession NPS301 during seed development, and these genes may therefore regulate PC in soybean. The results presented here contribute to an improved understanding of the mechanisms that regulate PC in soybean seeds.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>Conceptualization, HC. Formal analysis, HZ, WZ, and QW. Data curation, HZ and HC. Methodology, WZ, QW and WX. Investigation, HZ, and WX. Resources, HC and GZ. Funding acquisition, TH. Writing&#x2014;original draft, HZ, and WZ. Writing&#x2014;review and editing, HC, GZ, XL, XCu and XCh. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>This study was supported by National Key Research and Development Program of China (2018YFE0112200), the Key R&amp;D project of Jiangsu Province (BE2019376), the open competition project of seed industry revitalization of Jiangsu Province (JBGS[2021]060), Jiangsu Agricultural Science and Technology Innovation Fund (CX(22)5002), the Natural Science Foundation of China (32001455), and the Natural Science Foundation of Jiangsu Province (BK20210154).</p>
</sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2022.1045953/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2022.1045953/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table_1.xlsx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_2.xlsx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_3.xlsx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_4.xlsx" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bremner</surname> <given-names>J. M.</given-names>
</name>
</person-group> (<year>1960</year>). <article-title>Determination of nitrogen in soil by the kjeldahl method</article-title>. <source>J. Agric. Sci.</source> <volume>55</volume>, <fpage>11</fpage>&#x2013;<lpage>33</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S0021859600021572</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Danecek</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Auton</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Abecasis</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Albers</surname> <given-names>C. A.</given-names>
</name>
<name>
<surname>Banks</surname> <given-names>E.</given-names>
</name>
<name>
<surname>DePristo</surname> <given-names>M. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2011</year>). <article-title>The variant call format and VCFtools</article-title>. <source>Bioinf. (Oxford England)</source> <volume>27</volume>, <fpage>2156</fpage>&#x2013;<lpage>2158</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btr330</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Diers</surname> <given-names>B. W.</given-names>
</name>
<name>
<surname>Keim</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Fehr</surname> <given-names>W. R.</given-names>
</name>
<name>
<surname>Shoemaker</surname> <given-names>R. C.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>RFLP analysis of soybean seed protein and oil content</article-title>. <source>Theor. Appl. Genet.</source> <volume>83</volume>, <fpage>608</fpage>&#x2013;<lpage>612</lpage>. doi: <pub-id pub-id-type="doi">10.1007/BF00226905</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Genome-wide association studies dissect the genetic networks underlying agronomical traits in soybean</article-title>. <source>Genome Biol.</source> <volume>18</volume>, <fpage>161</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13059-017-1289-9</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goettel</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Qiao</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Hou</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>POWR1 is a domestication gene pleiotropically regulating seed quality and yield in soybean</article-title>. <source>Nat. Commun.</source> <volume>13</volume>, <fpage>3051</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-022-30314-7</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hufford</surname> <given-names>M. B.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>van Heerwaarden</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Pyh&#xe4;j&#xe4;rvi</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Chia</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Cartwright</surname> <given-names>R. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Comparative population genomics of maize domestication and improvement</article-title>. <source>Nat. Genet.</source> <volume>44</volume>, <fpage>808</fpage>&#x2013;<lpage>811</lpage>. doi: <pub-id pub-id-type="doi">10.1038/ng.2309</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hwang</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Song</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Jia</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Specht</surname> <given-names>J. E.</given-names>
</name>
<name>
<surname>Hyten</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Costa</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>A genome-wide association study of seed protein and oil content in soybean</article-title>. <source>BMC Genomics</source> <volume>15</volume>, <fpage>1</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1471-2164-15-1</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leamy</surname> <given-names>L. J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C. Y.</given-names>
</name>
<name>
<surname>Song</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>A genome-wide association study of seed composition traits in wild soybean (Glycine soja)</article-title>. <source>BMC Genomics</source> <volume>18</volume>, <fpage>18</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12864-016-3397-4</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname> <given-names>S. H.</given-names>
</name>
<name>
<surname>Bailey</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Mian</surname> <given-names>M. A. R.</given-names>
</name>
<name>
<surname>Carter</surname> <given-names>T. E.</given-names>
</name>
<name>
<surname>Shipe</surname> <given-names>E. R.</given-names>
</name>
<name>
<surname>Ashley</surname> <given-names>D. A.</given-names>
</name>
<etal/>
</person-group>. (<year>1996</year>). <article-title>RFLP loci associated with soybean seed protein and oil content across populations and locations</article-title>. <source>Theor. Appl. Genet.</source> <volume>93</volume>, <fpage>649</fpage>&#x2013;<lpage>657</lpage>. doi: <pub-id pub-id-type="doi">10.1007/BF00224058</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lipka</surname> <given-names>A. E.</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Peiffer</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Bradbury</surname> <given-names>P. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>GAPIT: genome association and prediction integrated tool</article-title>. <source>Bioinformatics</source> <volume>28</volume>, <fpage>2397</fpage>&#x2013;<lpage>2399</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/bts444</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Qi</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Fine mapping QTL and mining genes for protein content in soybean by the combination of linkage and association analysis</article-title>. <source>Theor. Appl. Genet.</source> <volume>134</volume>, <fpage>1095</fpage>&#x2013;<lpage>1122</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00122-020-03756-0</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Genome-wide association mapping for seed protein and oil contents using a large panel of soybean accessions</article-title>. <source>Genomics</source> <volume>111</volume>, <fpage>90</fpage>&#x2013;<lpage>95</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ygeno.2018.01.004</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mao</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Teng</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>2013</year>). <article-title>Identification of quantitative trait loci underlying seed protein and oil contents of soybean across multi-genetic backgrounds and environments</article-title>. <source>Plant Breed.</source> <volume>6</volume>, <fpage>630</fpage>&#x2013;<lpage>641</lpage>. doi: <pub-id pub-id-type="doi">10.1111/pbr.12091</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>St. Amand</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Bernardo</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>High-resolution genome-wide association study identifies genomic regions and candidate genes for important agronomic traits in wheat</article-title>. <source>Mol. Plant</source> <volume>13</volume>, <fpage>1311</fpage>&#x2013;<lpage>1327</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.molp.2020.07.008</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Patil</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Mian</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Vuong</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Pantalone</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Song</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>P.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Molecular mapping and genomics of soybean seed protein: a review and perspective for the future</article-title>. <source>Theor. Appl. Genet.</source> <volume>130</volume>, <fpage>1975</fpage>&#x2013;<lpage>1991</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00122-017-2955-8</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Piyaporn</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Watcharin</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hyten</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Qijian</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Cregan</surname> <given-names>P. B.</given-names>
</name>
<name>
<surname>Graef</surname> <given-names>G. L.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Multi-population selective genotyping to identify soybean [<italic>Glycine max</italic> (L.) merr.] seed protein and oil QTLs</article-title>. <source>G3 (Bethesda Md.)</source> <volume>6</volume>, <fpage>1635</fpage>&#x2013;<lpage>1648</lpage>. doi: <pub-id pub-id-type="doi">10.1534/g3.116.027656</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rotundo</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>Borr&#xe1;s</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Westgate</surname> <given-names>M. E.</given-names>
</name>
<name>
<surname>Orf</surname> <given-names>J. H.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Relationship between assimilate supply per seed during seed filling and soybean seed composition</article-title>. <source>Field Crop Res.</source> <volume>112</volume>, <fpage>90</fpage>&#x2013;<lpage>96</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.fcr.2009.02.004</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Samanfar</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Cober</surname> <given-names>E. R.</given-names>
</name>
<name>
<surname>Charette</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>L. H.</given-names>
</name>
<name>
<surname>Bekele</surname> <given-names>W. A.</given-names>
</name>
<name>
<surname>Morrison</surname> <given-names>M. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Genetic analysis of high protein content in &#x2018;AC proteus&#x2019;related soybean populations using SSR, SNP, DArT and DArTseq markers</article-title>. <source>Sci. Rep-Uk</source> <volume>9</volume>, <fpage>19657</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-019-55862-9</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sonah</surname> <given-names>H.</given-names>
</name>
<name>
<surname>O'Donoughue</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Cober</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Rajcan</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Belzile</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Identification of loci governing eight agronomic traits using a GBS-GWAS approach and validation by QTL mapping in soya bean</article-title>. <source>Plant Biotechnol. J.</source> <volume>13</volume>, <fpage>211</fpage>&#x2013;<lpage>221</lpage>. doi: <pub-id pub-id-type="doi">10.1111/pbi.12249</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Analyzing the effects of climate factors on soybean protein, oil contents, and composition by extensive and high-density sampling in China</article-title>. <source>J. Agr Food Chem.</source> <volume>64</volume>, <fpage>4121</fpage>&#x2013;<lpage>4130</lpage>. doi: <pub-id pub-id-type="doi">10.1021/acs.jafc.6b00008</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Shannon</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Zeng</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Orazaly</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Identification and mapping of stable QTL for protein content in soybean seeds</article-title>. <source>Mol. Breed.</source> <volume>35</volume>, <fpage>92</fpage>. doi: <pub-id pub-id-type="doi">10.1007/s11032-015-0285-6</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Warrington</surname> <given-names>C. V.</given-names>
</name>
<name>
<surname>Abdel-Haleem</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Hyten</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Cregan</surname> <given-names>P. B.</given-names>
</name>
<name>
<surname>Orf</surname> <given-names>J. H.</given-names>
</name>
<name>
<surname>Killam</surname> <given-names>A. S.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>QTL for seed protein and amino acids in the benning &#xd7; danbaekkong soybean population</article-title>. <source>Theor. Appl. Genet.</source> <volume>128</volume>, <fpage>839</fpage>&#x2013;<lpage>850</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00122-015-2474-4</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Liao</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Cui</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Du</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>A cation diffusion facilitator, GmCDF1, negatively regulates salt tolerance in soybean</article-title>. <source>PloS Genet.</source> <volume>15</volume>, <elocation-id>e1007798</elocation-id>. doi: <pub-id pub-id-type="doi">10.1371/journal.pgen.1007798</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>L&#xfc;</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Chu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>The genetic architecture of water-soluble protein content and its genetic relationship to total protein content in soybean</article-title>. <source>Sci. Rep-Uk</source> <volume>7</volume>, <fpage>5053</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-017-04685-7</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>W. K.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y. J.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>G. Z.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J. S.</given-names>
</name>
<name>
<surname>He</surname> <given-names>C. Y.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>X. L.</given-names>
</name>
<etal/>
</person-group>. (<year>2004</year>). <article-title>QTL mapping of ten agronomic traits on the soybean (<italic>Glycine max</italic> l. merr.) genetic map and their association with EST markers</article-title>. <source>Theor. Appl. Genet.</source> <volume>108</volume>, <fpage>1131</fpage>&#x2013;<lpage>1139</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00122-003-1527-2</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Zhen</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>A combined linkage and gwas analysis identifies QTLs linked to soybean seed protein and oil content</article-title>. <source>Int. J. Mol. Sci.</source> <volume>20</volume>, <fpage>5915</fpage>. doi: <pub-id pub-id-type="doi">10.3390/ijms20235915</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Cui</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>GmAOC4 modulates seed germination by regulating JA biosynthesis in soybean</article-title>. <source>Theor. Appl. Genet.</source> <volume>135</volume>, <fpage>439</fpage>&#x2013;<lpage>447</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00122-021-03974-0</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Cui</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Comparative selective signature analysis and high-resolution GWAS reveal a new candidate gene controlling seed weight in soybean</article-title>. <source>Theor. Appl. Genet.</source> <volume>134</volume>, <fpage>1329</fpage>&#x2013;<lpage>1341</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00122-021-03774-6</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Gou</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Lyu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Resequencing 302 wild and cultivated accessions identifies genes related to domestication and improvement in soybean</article-title>. <source>Nat. Biotechnol.</source> <volume>33</volume>, <fpage>125</fpage>&#x2013;<lpage>408</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nbt.3096</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>