<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fgene.2021.612492</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Genotyping and Whole-Genome Resequencing of Welsh Sheep Breeds Reveal Candidate Genes and Variants for Adaptation to Local Environment and Socioeconomic Traits</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Sweet-Jones</surname> <given-names>James</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1325704/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Lenis</surname> <given-names>Vasileios Panagiotis</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1323763/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Yurchenko</surname> <given-names>Andrey A.</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/817669/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Yudin</surname> <given-names>Nikolay S.</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/142845/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Swain</surname> <given-names>Martin</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/636474/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Larkin</surname> <given-names>Denis M.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/580417/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Royal Veterinary College, University of London</institution>, <addr-line>London</addr-line>, <country>United Kingdom</country></aff>
<aff id="aff2"><sup>2</sup><institution>Institute of Biological, Environmental and Rural Sciences, University of Aberystwyth</institution>, <addr-line>Aberystwyth</addr-line>, <country>United Kingdom</country></aff>
<aff id="aff3"><sup>3</sup><institution>School of Health and Life Sciences, Teesside University</institution>, <addr-line>Middlesbrough</addr-line>, <country>United Kingdom</country></aff>
<aff id="aff4"><sup>4</sup><institution>The Federal Research Center Institute of Cytology and Genetics, The Siberian Branch of the Russian Academy of Sciences (ICG SB RAS)</institution>, <addr-line>Novosibirsk</addr-line>, <country>Russia</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Anastasia Anashkina, Engelhardt Institute of Molecular Biology (RAS), Russia</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Qianjun Zhao, Chinese Academy of Agricultural Sciences (CAAS), China; Siroj Bakoev, Centre for Strategic Planning and Management of Biomedical Health, Russia; Jianlin Han, International Livestock Research Institute (ILRI), Kenya</p></fn>
<corresp id="c001">&#x002A;Correspondence: Denis M. Larkin, <email>dmlarkin@gmail.com</email></corresp>
<fn fn-type="other" id="fn004"><p>This article was submitted to Computational Genomics, a section of the journal Frontiers in Genetics</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>18</day>
<month>06</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>612492</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>09</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>10</day>
<month>05</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2021 Sweet-Jones, Lenis, Yurchenko, Yudin, Swain and Larkin.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Sweet-Jones, Lenis, Yurchenko, Yudin, Swain and Larkin</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec><title>Background</title>
<p>Advances in genetic tools applied to livestock breeding has prompted research into the previously neglected breeds adapted to harsh local environments. One such group is the Welsh mountain sheep breeds, which can be farmed at altitudes of 300 m above sea level but are considered to have a low productive value because of their poor wool quality and small carcass size. This is contrary to the lowland breeds which are more suited to wool and meat production qualities, but do not fare well on upland pasture. Herein, medium-density genotyping data from 317 individuals representing 15 Welsh sheep breeds were used alongside the whole-genome resequencing data of 14 breeds from the same set to scan for the signatures of selection and candidate genetic variants using haplotype- and SNP-based approaches.</p></sec>
<sec><title>Results</title>
<p>Haplotype-based selection scan performed on the genotyping data pointed to a strong selection in the regions of <italic>GBA3</italic>, <italic>PPARGC1A</italic>, <italic>APOB</italic>, and <italic>PPP1R16B</italic> genes in the upland breeds, and <italic>RNF24</italic>, <italic>PANK2</italic>, and <italic>MUC15</italic> in the lowland breeds. SNP-based selection scan performed on the resequencing data pointed to the missense mutations under putative selection relating to a local adaptation in the upland breeds with functions such as angiogenesis (<italic>VASH1</italic>), anti-oxidation (<italic>RWDD1</italic>), cell stress (<italic>HSPA5</italic>), membrane transport (<italic>ABCA13</italic> and <italic>SLC22A7</italic>), and insulin signaling (<italic>PTPN1</italic> and <italic>GIGFY1</italic>). By contrast, genes containing candidate missense mutations in the lowland breeds are related to cell cycle (<italic>CDK5RAP2</italic>), cell adhesion (<italic>CDHR3</italic>), and coat color (<italic>MC1R</italic>).</p></sec>
<sec><title>Conclusion</title>
<p>We found new variants in genes with potentially functional consequences to the adaptation of local sheep to their environments in Wales. Knowledge of these variations is important for improving the adaptative qualities of UK and world sheep breeds through a marker-assisted selection.</p></sec>
</abstract>
<kwd-group>
<kwd>sheep</kwd>
<kwd>signatures of selection</kwd>
<kwd>Wales</kwd>
<kwd>whole-genome resequencing</kwd>
<kwd>adaptation</kwd>
</kwd-group>
<contract-sponsor id="cn001">Russian Science Foundation<named-content content-type="fundref-id">10.13039/501100006769</named-content></contract-sponsor>
<counts>
<fig-count count="3"/>
<table-count count="3"/>
<equation-count count="0"/>
<ref-count count="80"/>
<page-count count="13"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1">
<title>Introduction</title>
<p>Since the domestication in the semi-arid Fertile Crescent of Iran and Turkey, sheep (<italic>Ovis aries</italic>) have undergone migration and selection to form established breeds that are well-suited to various local environments (<xref ref-type="bibr" rid="B80">Zeder, 2008</xref>). The process of natural or artificial positive/negative selection results in genomic regions of a decreased diversity, which are known as the signatures of selection (<xref ref-type="bibr" rid="B36">Kijas et al., 2012</xref>). Detecting signatures of selection is important for understanding the genetic mechanisms of the adaptation of breeds to their local environments. Previous investigations have unearthed genes relating to hypoxia in sheep adapted to high altitudes on the Qinghai-Tibetan Plateau of China (<italic>THRB</italic>) (<xref ref-type="bibr" rid="B77">Yang et al., 2016</xref>), fat deposition in sheep from arid deserts of northern Africa (<italic>PCDH9</italic>) (<xref ref-type="bibr" rid="B37">Kim et al., 2016</xref>), and metabolism in Russian sheep adapted to low temperatures (<italic>POMC</italic>) (<xref ref-type="bibr" rid="B79">Yurchenko et al., 2019</xref>). Whilst these examples represent the extreme circumstances, there are examples of selection in sheep adapted to more temperate climates. For instance, three upland sheep breeds from northern England were shown to demonstrate higher than expected frequencies of the known missense mutations in genes associated with reproductive success (<italic>PRLP</italic>) and presence of horns (<italic>RXFP2</italic>) (<xref ref-type="bibr" rid="B14">Bowles et al., 2014</xref>). Knowledge of such selection is essential for the continued improvement of breeds better suited to their environments and with a better socioeconomic trait potential in current selection programs, which is particularly pressing in terms of climate change (<xref ref-type="bibr" rid="B13">Bowles, 2015</xref>). Here, we investigated another example of previously neglected breeds adapted to local environments in Wales, United Kingdom, where sheep have historically been farmed at altitudes of &#x003E;1,000 feet (&#x223C;300 m) above sea level on a rough pasture with shallow-rooted plants (<xref ref-type="bibr" rid="B18">Davies, 1935</xref>).</p>
<p>Sheep were introduced to Wales by Neolithic settlers, bringing a primitive breed similar to the contemporary Soay (6,000 years ago) with two likely further introductions by Roman white-faced, fine-wool breeds (2,000 years ago) and Norse black-faced breeds (1,000 years ago) (<xref ref-type="bibr" rid="B61">Ryder, 1964</xref>). The South Wales Welsh Mountain (SWWM) breed of today, a descendent of the Roman and Soay breeds, has been documented since the 16th century and is renowned for its hardiness, lambing ability, and sweet meat taste. Despite this potential economic gain, these mountain sheep suffer a trade-off to a kemp wool and small carcass size, leading them to be poorly exploited outside of Wales (<xref ref-type="bibr" rid="B74">Williams-Davies, 1981</xref>). To overcome this, the SWWM breed was cross-bred in the eighteenth century to form a number of more productive local breeds, which are now farmed on the lowlands (<xref ref-type="bibr" rid="B61">Ryder, 1964</xref>; <xref ref-type="bibr" rid="B74">Williams-Davies, 1981</xref>).</p>
<p>Previous work to reveal the population history of Welsh sheep showed that Welsh breeds clustered closely with each other based on haplotype sharing, forming two groups within this cluster, which aligned with the upland or lowland farming style. Exceptions to this were the Black Welsh Mountain (BWM) and Kerry Hill with Beulah, which remained distinct from all other breeds (<xref ref-type="bibr" rid="B8">Beynon et al., 2015</xref>). This distinction of BWM is supportive of the alternate ancestry from Norse breeds and deliberate selection based on coat color (<xref ref-type="bibr" rid="B74">Williams-Davies, 1981</xref>). Moreover, the divergence of Kerry Hill and Beulah may be the result of a genetic bottleneck or a founder effect that these breeds underwent. Additional support of this can be seen in the low effective population sizes and high inbreeding coefficients of these breeds (<xref ref-type="bibr" rid="B8">Beynon et al., 2015</xref>). Low effective population sizes endanger these breeds to risks of increased homozygosity and lack of genetic diversity due to inbreeding. This is a potential risk for UK upland sheep breeds who have remained geographically and genetically isolated due to their adaptability to thrive on pastures that other breeds cannot (<xref ref-type="bibr" rid="B14">Bowles et al., 2014</xref>; <xref ref-type="bibr" rid="B30">Heaton et al., 2014</xref>).</p>
<p>With this in mind, it is important, from a perspective of cultural significance, breed conservation, and breed improvement, to study the adaptation of Welsh breeds, which potentially offers insight into genomic adaption to upland farming, as well as lambing and meat quality. Likewise, lowland productive breeds offer a good comparison due to their stronger capabilities for traits related to socioeconomic gain. Through the use of a commercially available medium-density SNP genotyping array with a HapFLK and Decorrelated Composite of Multiple Statistics (DCMS) software and whole-genome resequencing data with a DCMS pipeline, this paper aims to identify the signatures of selection in the genomes of Welsh sheep breeds and candidate genes containing functional missense mutations in these regions.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec id="S2.SS1">
<title>Data Source and Variant Calling</title>
<p>Genotyping data from 353 individuals across 18 Welsh breeds on the Illumina OvineSNP50 SNP array from <xref ref-type="bibr" rid="B8">Beynon et al. (2015)</xref> were used in this study. Illumina pair-ended read (150 bp) resequencing of 11 Welsh sheep samples from the same set, representing one sample per breed (<xref ref-type="supplementary-material" rid="SM2">Supplementary Table 1</xref>), was performed at the University of Aberystwyth to &#x223C;13&#x00D7; raw coverage using Illumina HiSeq according to the manufacturer&#x2019;s protocol. Three remaining Welsh sheep resequenced genomes for Welsh Hardy-Speckled Faced, Dolgellau Welsh Mountain, and Talybont Welsh Mountain were downloaded from the National Centre for Biotechnology Information Sequence Read Archive, PRJNA160933 (<xref ref-type="bibr" rid="B30">Heaton et al., 2014</xref>). A dataset of resequenced Russian sheep samples (<italic>n</italic> = 40) adapted to a contrasting environment was used as an outgroup in this study (<xref ref-type="bibr" rid="B64">Sweet-Jones et al., 2021</xref>).</p>
<p>Reads were mapped by using the Burrows-Wheeler Aligner BWA-MEM (BWA V.0.7.10 (<xref ref-type="bibr" rid="B42">Li, 2013</xref>) to the reference sheep genome Oar_V.3.1. Reads were sorted using the Samtools V.0.1.18 (<xref ref-type="bibr" rid="B43">Li et al., 2009</xref>) and duplicates were marked with the Picard V.2.18<sup><xref ref-type="fn" rid="footnote1">1</xref></sup>. Libraries were also merged using Picard. Base Quality Score Recalibration (BQSR) was performed, which account for the systematic errors in sequencing, using the Genome Analysis Toolkit (GATK V.3.8; <xref ref-type="bibr" rid="B50">McKenna et al., 2010</xref>). Samples then underwent variant calling with the GATK HaplotypeCaller function. Finally, all samples (<italic>n</italic> = 54) underwent joint calling to merge all reported variants into a single vcf file. Following this, hard filtering for quality scores assigned by BQSR was performed by GATK, using the filter expression &#x201C;[QD &#x003C; 2.0| | FS &#x003E; 60.00| | MQ &#x003C; 40.00| | MQRankSum &#x003C; &#x2212;12.5| | ReadPosRankSum &#x003C; &#x2212;8.0].&#x201D; All variants from resequenced data were converted into a Plink V.1.90 (<xref ref-type="bibr" rid="B59">Purcell et al., 2007</xref>) format to be run through the DCMS pipeline (<xref ref-type="bibr" rid="B79">Yurchenko et al., 2019</xref>).</p>
</sec>
<sec id="S2.SS2">
<title>HapFLK Statistics</title>
<p>Welsh breed genotyping data were separated into three groups of related breeds based on the clustering analysis performed by <xref ref-type="bibr" rid="B8">Beynon et al. (2015)</xref>, resulting in one group of upland breeds and two groups of lowland breeds. Of the two lowland groups, one consisted of five lowland breeds and the other consisted of only the Kerry Hill and Beulah breeds (KHB) (<xref ref-type="table" rid="T1">Table 1</xref>). Plink-formatted (<xref ref-type="bibr" rid="B59">Purcell et al., 2007</xref>) files for the upland and lowland breed groups had genotypes from the sex chromosomes removed and were filtered to remove the rare alleles [&#x2013;maf 0.05], low called SNPs [&#x2013;geno 0.01], or poorly genotyped individuals [&#x2013;mind 0.05]. FastPhase V.1.4 (<xref ref-type="bibr" rid="B62">Scheet and Stephens, 2006</xref>) was used to estimate the number of haplotype clusters (k) for each group (Lowland k = 48, KHB k = 25, and Upland k = 53). HapFLK software (<xref ref-type="bibr" rid="B10">Bonhomme et al., 2010</xref>) was used to obtain selection statistics for each group. This test uses the hierarchal population structure to identify the haplotype-based selective sweeps, which focuses on the inherited combinations of alleles. It has the advantage of an increased statistical power, reliably detecting the hard and soft selective sweeps, and is a realistic simulation of selection through the haplotypes. HapFLK <italic>p</italic>-values were calculated using the Python script scaling_chi2_hapflk.py (<xref ref-type="bibr" rid="B10">Bonhomme et al., 2010</xref>; <xref ref-type="bibr" rid="B22">Fariello et al., 2013</xref>). Adjusted <italic>p</italic>-values, or <italic>q</italic>-values, were calculated through the R qqman <italic>q</italic>-value function (<xref ref-type="bibr" rid="B69">Turner, 2014</xref>). Selected intervals were determined by boundaries of <italic>q</italic> &#x003C; 0.05 with SNPs within an interval of <italic>q</italic> &#x003C; 0.01 considered to be under a strong selection.</p>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Breed representation in the genotyping and resequencing datasets.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Breed</td>
<td valign="top" align="center">Abbreviation</td>
<td valign="top" align="center">Genotyped samples</td>
<td valign="top" align="center">Horns</td>
<td valign="top" align="left">Base color</td>
<td valign="top" align="center">Fleece</td>
<td valign="top" align="left">HapFLK group</td>
<td valign="top" align="left">Resequencing group</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Badger Faced Welsh Mountain</td>
<td valign="top" align="center">BFWM</td>
<td valign="top" align="center">21</td>
<td valign="top" align="center">Yes</td>
<td valign="top" align="left">Black and white</td>
<td valign="top" align="center">Firm</td>
<td valign="top" align="left">Upland</td>
<td valign="top" align="left">NA&#x002A;</td>
</tr>
<tr>
<td valign="top" align="left">Balwen</td>
<td valign="top" align="center">&#x2212;</td>
<td valign="top" align="center">14</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">Black and white</td>
<td valign="top" align="center">Firm</td>
<td valign="top" align="left">Upland</td>
<td valign="top" align="left">Upland</td>
</tr>
<tr>
<td valign="top" align="left">Beulah</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">22</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">Black and white</td>
<td valign="top" align="center">Fine</td>
<td valign="top" align="left">KHB</td>
<td valign="top" align="left">Lowland</td>
</tr>
<tr>
<td valign="top" align="left">Black Welsh Mountain</td>
<td valign="top" align="center">BWM</td>
<td valign="top" align="center">24</td>
<td valign="top" align="center">Yes</td>
<td valign="top" align="left">Black</td>
<td valign="top" align="center">Firm</td>
<td valign="top" align="left">Upland</td>
<td valign="top" align="left">Upland</td>
</tr>
<tr>
<td valign="top" align="left">Brecknock Hill Cheviot</td>
<td valign="top" align="center">BHC</td>
<td valign="top" align="center">24</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">White</td>
<td valign="top" align="center">Fine</td>
<td valign="top" align="left">Upland</td>
<td valign="top" align="left">Upland</td>
</tr>
<tr>
<td valign="top" align="left">Clun Forest</td>
<td valign="top" align="center">&#x2212;</td>
<td valign="top" align="center">17</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">Black</td>
<td valign="top" align="center">Fine</td>
<td valign="top" align="left">Lowland</td>
<td valign="top" align="left">Lowland</td>
</tr>
<tr>
<td valign="top" align="left">Dolgellau Welsh Mountain</td>
<td valign="top" align="center">DWM</td>
<td valign="top" align="center">&#x2212;</td>
<td valign="top" align="center">Yes</td>
<td valign="top" align="left">White</td>
<td valign="top" align="center">Firm</td>
<td valign="top" align="left">NA&#x002A;</td>
<td valign="top" align="left">Upland</td>
</tr>
<tr>
<td valign="top" align="left">Hardy Speckled Faced</td>
<td valign="top" align="center">HSF</td>
<td valign="top" align="center">24</td>
<td valign="top" align="center">Yes</td>
<td valign="top" align="left">White</td>
<td valign="top" align="center">Fine</td>
<td valign="top" align="left">Lowland</td>
<td valign="top" align="left">Lowland</td>
</tr>
<tr>
<td valign="top" align="left">Hill Radnor</td>
<td valign="top" align="center">&#x2212;</td>
<td valign="top" align="center">21</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">Gray-brown</td>
<td valign="top" align="center">Fine</td>
<td valign="top" align="left">Lowland</td>
<td valign="top" align="left">Lowland</td>
</tr>
<tr>
<td valign="top" align="left">Kerry Hill</td>
<td valign="top" align="center">&#x2212;</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">White</td>
<td valign="top" align="center">Fine</td>
<td valign="top" align="left">KHB</td>
<td valign="top" align="left">Lowland</td>
</tr>
<tr>
<td valign="top" align="left">Llandovery White Faced</td>
<td valign="top" align="center">LWF</td>
<td valign="top" align="center">24</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">White</td>
<td valign="top" align="center">Fine</td>
<td valign="top" align="left">Upland</td>
<td valign="top" align="left">Upland</td>
</tr>
<tr>
<td valign="top" align="left">Llanwenog</td>
<td valign="top" align="center">&#x2212;</td>
<td valign="top" align="center">21</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">Black</td>
<td valign="top" align="center">Fine</td>
<td valign="top" align="left">Lowland</td>
<td valign="top" align="left">Lowland</td>
</tr>
<tr>
<td valign="top" align="left">Lleyn</td>
<td valign="top" align="center">&#x2212;</td>
<td valign="top" align="center">22</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">White</td>
<td valign="top" align="center">Fine</td>
<td valign="top" align="left">Lowland</td>
<td valign="top" align="left">Lowland</td>
</tr>
<tr>
<td valign="top" align="left">South Wales Welsh Mountain</td>
<td valign="top" align="center">SWWM</td>
<td valign="top" align="center">17</td>
<td valign="top" align="center">Yes</td>
<td valign="top" align="left">White</td>
<td valign="top" align="center">Firm</td>
<td valign="top" align="left">Upland</td>
<td valign="top" align="left">Upland</td>
</tr>
<tr>
<td valign="top" align="left">Talybont Welsh Mountain</td>
<td valign="top" align="center">TWM</td>
<td valign="top" align="center">24</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">White</td>
<td valign="top" align="center">Firm</td>
<td valign="top" align="left">Upland</td>
<td valign="top" align="left">Upland</td>
</tr>
<tr>
<td valign="top" align="left">Welsh Mountain Hill Flock</td>
<td valign="top" align="center">WMHF</td>
<td valign="top" align="center">24</td>
<td valign="top" align="center">Yes</td>
<td valign="top" align="left">White</td>
<td valign="top" align="center">Firm</td>
<td valign="top" align="left">Upland</td>
<td valign="top" align="left">NA</td>
</tr>
<tr>
<td valign="top" align="left">Average/Total</td>
<td valign="top" align="center">&#x2212;</td>
<td valign="top" align="center">21/317</td>
<td valign="top" align="center">No</td>
<td valign="top" align="left">&#x2212;</td>
<td valign="top" align="center">&#x2212;</td>
<td valign="top" align="left">102/40/173</td>
<td valign="top" align="left">7/7</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<attrib><italic>&#x002A;NA denotes the exclusion of breed from either the HapFLK or resequencing study due to the unavailability of samples.</italic></attrib>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="S2.SS3">
<title>De-correlated Composite of Multiple Signals (DCMS)</title>
<p>Five established measures of selection and genetic diversity were both used on the genotyping (15 breeds) and whole genome resequencing (upland breeds <italic>n</italic> = 7; lowland breeds = 7) datasets as a DCMS (<xref ref-type="table" rid="T1">Table 1</xref>; <xref ref-type="bibr" rid="B48">Ma et al., 2015</xref>). Statistics used were: (i/ii) <italic>H2</italic>/<italic>H1</italic> and <italic>H12</italic>, which can distinguish the hard and soft selective sweeps by measuring the intensity of selection (<xref ref-type="bibr" rid="B25">Garud et al., 2015</xref>); (iii) Tajima&#x2019;s <italic>D</italic> comparing pairwise sequence differences and the number of segregating sites, detecting positive, negative, or balancing selection (<xref ref-type="bibr" rid="B65">Tajima, 1989</xref>); (iv) nucleotide diversity (<italic>Pi</italic>), average number of nucleotide differences between two sequences (<xref ref-type="bibr" rid="B53">Nei and Li, 1979</xref>); (v) <italic>F</italic><sub><italic>ST</italic></sub> fixation index, comparing single SNP frequencies across a population (<xref ref-type="bibr" rid="B73">Weir and Cockerham, 1984</xref>). By weighting the result of each statistic and generating a combined score, regions that overlap in the analysis outcomes gain a stronger evidence to be a region under selection.</p>
</sec>
<sec id="S2.SS4">
<title>H2/H1 and H12</title>
<p>Autosomal SNPs were filtered for &#x2013;maf 0.0000001 &#x2013;geno 0.1 &#x2013;mind 0.1 by Plink. SNPs were then phased by chromosome using ShapeIt2 (<xref ref-type="bibr" rid="B20">Delaneau et al., 2011</xref>) with 400 states and an effective population size of 100. Phased chromosomes were split into appropriate groupings per chromosome using Plink and H2/H1, H12 were calculated using the H1_H12.py Python script (<xref ref-type="bibr" rid="B25">Garud et al., 2015</xref>). H2/H1 and H12 values were calculated in windows of 25 SNPs using a step size of one SNP following our previous study (<xref ref-type="bibr" rid="B79">Yurchenko et al., 2019</xref>).</p>
</sec>
<sec id="S2.SS5">
<title>Tajima&#x2019;s <italic>D</italic></title>
<p>Tajima&#x2019;s <italic>D</italic> for mutation index was calculated over the same intervals of 25 SNPs, whose lengths were calculated from the output of the H2/H1 and H12 statistics. Using the vcftools V.0.1.13 (<xref ref-type="bibr" rid="B17">Danecek et al., 2011</xref>), Tajima&#x2019;s D was calculated [&#x2013;TajimaD 900000000] for each chromosome per group/breed file per window. Output files were concatenated per group.</p>
</sec>
<sec id="S2.SS6">
<title>Fixation Index</title>
<p><italic>F</italic><sub><italic>ST</italic></sub> was calculated with Plink comparing each group to all others. All negative values were converted to zero, and data were smoothed with the R <italic>runmed</italic> function in windows of 31 SNPs.</p>
</sec>
<sec id="S2.SS7">
<title>Nucleotide Diversity</title>
<p>Plink-format file was split by chromosome per breed, and nucleotide diversity was calculated with the vcftools [&#x2013;site-pi] option. Data were then smoothed using the R <italic>runmed</italic> function in windows of 31 SNPs.</p>
</sec>
<sec id="S2.SS8">
<title>Combining Statistics With DCMS</title>
<p>Output files from individual statistics were sorted and joined by SNP id. Genome-wide <italic>p</italic>-values through ranking results of each statistic were calculated in the R MINOTAUR <italic>stat-to-p</italic>-value function specifying the one-tailed tests (H2/H1, H12, <italic>F</italic><sub><italic>ST</italic></sub>&#x2013;right tailed, Pi, and Tajima&#x2019;s D&#x2013;left tailed). Covariance matrix was constructed based on sampling 300,000 randomly sampled SNPs using the R <italic>CovNAMcd</italic> function where the alpha = 0.75. DCMS statistics were calculated using the <italic>DCMS</italic> function and fitted to a normal distribution to examine normality implemented by the R MASS <italic>rlm</italic> function. These fitted DCMS values were converted to <italic>p</italic>-values using <italic>pnorm</italic>, and adjusted for a false discovery rate with the <italic>qvalue</italic> function. <italic>Q</italic>-values were parsed to determine selection with region boundaries set at a <italic>q</italic> &#x003C; 0.2 and a threshold of <italic>q</italic> &#x003C; 0.01.</p>
</sec>
<sec id="S2.SS9">
<title>Candidate Gene Search</title>
<p>For the regions defined by our pipelines as being under selection, genes were identified using a list of 26,958 genes of the Oar_V.3.1 genome downloaded from Ensembl BioMart v.98. Within each selected region, genes were then ranked based on their distances to the most significant SNP of that region with the closest gene being the top-ranking. The top 10 highest ranking genes from each region underwent literature review for their previous associations to adaptation to local environments or socioeconomic traits in animals. Genes with established links to these traits were identified as candidate genes in this study.</p>
<p>In the resequencing study, all SNPs were annotated with NGS-SNP (<xref ref-type="bibr" rid="B27">Grant et al., 2011</xref>) to identify missense mutations. Only genes with missense mutations in the regions under selection were considered for literature review. Additionally, missense SNPs with a strong support from the <italic>F</italic><sub><italic>ST</italic></sub> statistic (<italic>F</italic><sub><italic>ST</italic></sub> &#x2265; 0.3) were analyzed with PolyPhen2 to predict their effects on protein structure and function (0 = benign and 1 = deleterious; <xref ref-type="bibr" rid="B1">Adzhubei et al., 2013</xref>).</p>
<p>Functional enrichment analysis was performed using the Database for Annotation, Visualization, and Integrated Discovery (DAVID) v. 6.8 (<xref ref-type="bibr" rid="B31">Huang et al., 2009</xref>) using the same gene list downloaded from Ensembl Biomart v. 98. Enrichments were detected using the DAVID functional clustering tool, which verifies enrichments of similar GO terms across many different databases, to confer a stronger evidence of enrichment. Scores &#x003E; 1.3-fold enrichment were considered.</p>
</sec>
<sec id="S2.SS10">
<title>Copy Number Variant (CNV) Analysis of Resequenced Genomes</title>
<p>CNV detection was performed to identify the regions in the genomes of Welsh sheep that had been duplicated or deleted with respect to the Texel reference genome. We identified CNVs in the resequenced samples with the cn.Mops R package (<xref ref-type="bibr" rid="B38">Klambauer et al., 2012</xref>) in a window length of 700 SNPs, using sequences that had undergone BQSR. This resulted in each individual being given a raw copy number (CN) per window. CN1&#x2013;CN3 were considered to be normal and discounted from the results. Raw CNVs were merged into the CNV Regions (CNVRs) with the BedOps <italic>bedmap</italic> function using at least 50% reciprocal overlap in at least three individuals within the same group as criteria for inclusion. Duplicate CNVRs were removed, and the neighboring CNVRs were merged. This allowed us to be confident in our results by excluding the regions where CNVRs appear to overlap the signatures of selection, as these cast doubt over their reliability.</p>
</sec>
<sec id="S2.SS11">
<title>Data Visualization</title>
<p>HapFLK clusterplots and haplotype trees were visualized from the prepared R scripts available (<xref ref-type="bibr" rid="B10">Bonhomme et al., 2010</xref>; <xref ref-type="bibr" rid="B22">Fariello et al., 2013</xref>). All Manhattan plots were rendered in R by the <italic>qqman</italic> package setting the suggestive line (<italic>q</italic> = 0.05) and genome-wide line (<italic>q</italic> = 0.01) to indicate selection. Haplostrips for visualization of haplotype sharing (<xref ref-type="bibr" rid="B49">Marnetto and Huerta-S&#x00E1;nchez, 2017</xref>) in the regions under selection detected by DCMS were run using phased data.</p>
</sec>
</sec>
<sec id="S3">
<title>Results</title>
<sec id="S3.SS1">
<title>Regions Under Selection Detected From Genotyping Data</title>
<p>Using the HapFLK software, signatures of selection were found in each grouping using 44,711 SNPs (lowland group contained one region, KHB-two, and upland-31; <xref ref-type="supplementary-material" rid="SM2">Supplementary Tables 2</xref>&#x2013;<xref ref-type="supplementary-material" rid="SM2">4</xref>). Cluster plots and Haplotype Trees for the most significantly selected regions in the KBH group are shown in <xref ref-type="fig" rid="F1">Figure 1</xref> and for other groups, in <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 1</xref>. Lengths of the regions found under selection ranged from 1.81 to 64.78 Mb with a median length of 7.33 Mb. Moreover, DCMS also found the regions under selection in all 15 breeds, with at least one region of a strong selection (<italic>q</italic> &#x003C; 0.01) in each breed using 47,366 SNPs. Lengths of the regions under selection ranged from 1 to 3.9 Mb where the median length of regions was 0.16 Mb. The number of regions detected in each breed ranged from 8 in Kerry Hill to 89 in Clun Forest (<xref ref-type="supplementary-material" rid="SM2">Supplementary Tables 5</xref>&#x2013;<xref ref-type="supplementary-material" rid="SM2">19</xref>). In these regions under selection, 1,089 unique genes were found, with 179 occurring in multiple breeds including: <italic>GBA3</italic> (Hill Radnor, LWF, Lleyn, SWWM, TWM, and WMHF), <italic>ENSOARG00000021104</italic> (BFWM, Clun Forest, Hill Radnor, and Lleyn), <italic>PCDH9</italic> (BHC, Hill Radnor, and Llanwenog), and <italic>PPARGCA1</italic> (LWF, SWWM, and WMHF). Manhattan plots for all the breeds investigated are shown in <xref ref-type="fig" rid="F2">Figure 2</xref> and <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 2</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Output of genomic regions under strong selection in the KHB group from the HapFLK study. This includes the Manhattan plot <bold>(A)</bold> with a gene proximal to the most significant SNP of the highly selected peaks. Cluster plot <bold>(B)</bold> shows the tracks of haplotype diversity for the peak highlighted on the Manhattan plot by black borders where the red line represents the most significant SNP.</p></caption>
<graphic xlink:href="fgene-12-612492-g001.tif"/>
</fig>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Manhattan plots of Llandovery White-faced <bold>(A)</bold> and South Wales Welsh Mountain <bold>(B)</bold> genotyped breeds&#x2019; DCMS output. All other breeds are shown in <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 2</xref>. Selection thresholds for a suggestive (<italic>q</italic> &#x003C; 0.05) and strong (<italic>q</italic> &#x003C; 0.01) selection shown by blue and red lines, respectively. Significant selection peaks have been annotated with the name of the top-ranked gene of that region.</p></caption>
<graphic xlink:href="fgene-12-612492-g002.tif"/>
</fig>
<p>There was a substantial overlap between the results for a region found on OAR6: 31.99&#x2013;46.00 Mb (<italic>q</italic> = 2.0 &#x00D7; 10<sup>&#x2013;5</sup>) in the upland breeds in the HapFLK study to a narrower region, OAR6: 40.20&#x2013;43.38 Mb, in LWF (<italic>q</italic> = 6.9 &#x00D7; 10<sup>&#x2013;15</sup>), WMHF (<italic>q</italic> = 4.3 &#x00D7; 10<sup>&#x2013;11</sup>), and SWWM (<italic>q</italic> = 8.73 &#x00D7; 10<sup>&#x2013;5</sup>). In all cases, the top ranked genes were <italic>GBA3</italic> linked to liver metabolism (<xref ref-type="bibr" rid="B19">Dekker et al., 2011</xref>) and <italic>PPARGC1A</italic> with known roles in mitochondrial biogenesis, fat deposition, and milk fatty acid composition in cattle (<xref ref-type="bibr" rid="B24">Fernandez-Marcos and Auwerx, 2011</xref>; <xref ref-type="bibr" rid="B2">Armstrong et al., 2018</xref>; <xref ref-type="bibr" rid="B78">Yuan et al., 2019</xref>; <xref ref-type="bibr" rid="B41">Li et al., 2016</xref>). On the HapFLK cluster plot for this region, low diversity was seen in the Balwen, BWM, LWF, and SWWM breeds, further supporting the idea of selection for this region. When plotted on a haplotype tree, it can be seen that Balwen had the longest branch compared to the other upland breeds, whilst the strongest signature of selection is seen in SWWM (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 1</xref>).</p>
<p>Several other candidate regions detected by HapFLK overlapped with the regions found in the Welsh breeds by DCMS. OAR3: 23.23&#x2013;33.86 Mb (<italic>q</italic> = 5.0 &#x00D7; 10<sup>&#x2013;6</sup>) shared its top-ranked genes, <italic>TDRD15</italic> and <italic>APOB</italic>, with a region under selection in the upland Balwen breed (<italic>q</italic> = 0.0003). These genes are associated with cholesterol mobilization in Large White pigs (<xref ref-type="bibr" rid="B12">Bovo et al., 2019</xref>). OAR7: 47.55&#x2013;54.20 Mb (<italic>q</italic> = 0.0008) overlapped with another region OAR7: 51.30&#x2013;52.76 Mb in the upland BWM (<italic>q</italic> = 5.0 &#x00D7; 10<sup>&#x2013;9</sup>), but these did not share the top-ranked genes. Strong overlapping candidate genes are presented in <xref ref-type="table" rid="T2">Table 2</xref>.</p>
<table-wrap position="float" id="T2">
<label>TABLE 2</label>
<caption><p>Candidate genomic regions and genes from the HapFLK analysis and corresponding DCMS region.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">OAR</td>
<td valign="top" align="left">Region start</td>
<td valign="top" align="left">Region end</td>
<td valign="top" align="center">Group</td>
<td valign="top" align="left"><italic>q</italic>-value</td>
<td valign="top" align="left">Candidate genes (rank)</td>
<td valign="top" align="left">Function</td>
<td valign="top" align="center">Overlapping DCMS result</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">258,588,662</td>
<td valign="top" align="left">275,499,089</td>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left">0.0002</td>
<td valign="top" align="left"><italic>SIM2(1), CLDN14(2)</italic></td>
<td valign="top" align="justify"/>
<td valign="top" align="justify"/>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">23,229,012</td>
<td valign="top" align="left">33,863,536</td>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left">4.0&#x00A0;&#x00D7;&#x00A0;10<sup>&#x2013;6</sup></td>
<td valign="top" align="left"><italic>TDRD15(1), APOB(2)</italic></td>
<td valign="top" align="left">Cholesterol efflux</td>
<td valign="top" align="center">Balwen</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="left">31,991,037</td>
<td valign="top" align="left">45,997,407</td>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left">1.0 &#x00D7; 10<sup>&#x2013;5</sup></td>
<td valign="top" align="left"><italic>GBA3(1), PPARGC1A(2), DHX15(3), SOD3(4), KCNIP4(6)</italic></td>
<td valign="top" align="left">Metabolism</td>
<td valign="top" align="center">LWF, WMHF, SWWM</td>
</tr>
<tr>
<td valign="top" align="left">10</td>
<td valign="top" align="left">35,062,152</td>
<td valign="top" align="left">51,872,705</td>
<td valign="top" align="center">KHB</td>
<td valign="top" align="left">8.0 &#x00D7; 10<sup>&#x2013;5</sup></td>
<td valign="top" align="left"><italic>KLHL1(1), PCDH9(2)</italic></td>
<td valign="top" align="left">Neurodevelopment, cell adhesion</td>
<td valign="top" align="justify"/>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="left">46,620,758</td>
<td valign="top" align="left">72,941,741</td>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left">2.0 &#x00D7; 10<sup>&#x2013;6</sup></td>
<td valign="top" align="left"><italic>DHX35(1), PPP1R16B(3), ADIG(6)</italic></td>
<td valign="top" align="left">Innate immunity, angiogenesis</td>
<td valign="top" align="center">BFWM</td>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="left">47,164,400</td>
<td valign="top" align="left">54,366,328</td>
<td valign="top" align="center">Lowland</td>
<td valign="top" align="left">0.01</td>
<td valign="top" align="left"><italic>RNF24(1), PANK2(2), MAVS(3)</italic></td>
<td valign="top" align="left">Vision</td>
<td valign="top" align="center">HSF</td>
</tr>
<tr>
<td valign="top" align="left">15</td>
<td valign="top" align="left">32,152,675</td>
<td valign="top" align="left">65,710,885</td>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left">4.0 &#x00D7; 10<sup>&#x2013;7</sup></td>
<td valign="top" align="left"><italic>MUC15(1), ANO3(3)</italic></td>
<td valign="top" align="left">Mucous production</td>
<td valign="top" align="justify"/>
</tr>
</tbody>
</table></table-wrap>
<p>The most strongly selected region in the HapFLK study was seen on OAR15 32.15&#x2013;72.10 Mb in the KHB lowland group, with the top-ranking gene being <italic>MUC15</italic> (<italic>q</italic> = 4.1 &#x00D7; 10<sup>&#x2013;7</sup>), associated with a low fecal egg count in Spanish Churra sheep during gastrointestinal parasite infections (<xref ref-type="bibr" rid="B56">Periasamy et al., 2014</xref>; <xref ref-type="bibr" rid="B6">Benavides et al., 2015</xref>). This was supported by a low haplotype diversity seen in the Kerry Hill breed at this locus, but this signature was not seen in Beulah or in the DCMS results in either breeds.</p>
<p>In the other lowland group, the only region found under selection, OAR13: 47.16&#x2013;54.37 Mb (<italic>q</italic> = 0.01), overlapped with another region found in the upland group, OAR13: 46.62&#x2013;72.94 Mb (<italic>q</italic> = 2.0 &#x00D7; 10<sup>&#x2013;6</sup>), but the top candidate genes were different. In the lowland breeds, the top-ranked genes were <italic>RNF24</italic> and <italic>PANK2</italic>, which have been found under selection in world sheep breeds in association to a loss of vision following domestication (<xref ref-type="bibr" rid="B52">Naval-Sanchez et al., 2018</xref>; <xref ref-type="bibr" rid="B70">Wang et al., 2019</xref>). Cluster plots for this region showed a decreased haplotype diversity amongst the selected region on OAR13 in the lowland breeds, especially Clun Forest and HSF. Furthermore, significant selection at this locus in HSF (<italic>q</italic> = 0.0006) was confirmed using the DCMS pipeline. In the case of the upland breeds, the top-ranked genes were <italic>DHX35</italic> and <italic>PPP1R16B</italic> which are related to innate viral immunity (<xref ref-type="bibr" rid="B60">Rahman et al., 2017</xref>) and endothelial cell proliferation (<xref ref-type="bibr" rid="B58">Pszczola et al., 2018</xref>), respectively.</p>
<p>The genes found within the regions under selection from HapFLK, functional enrichments seen for the KHB group included the DENN domain and connexin gap junctions, enriched 1.6- and 1.4-fold, respectively. The most highly enriched terms in the upland breeds were bactericidal permeability protein, major intrinsic protein, and semaphorins, which were all enriched over threefold. The most enriched cluster seen in the genotyping DCMS analysis was the Type II keratin filaments from the Hill Radnor breed, which was enriched fivefold. This was followed by the Ribonuclease A in Clun forest, enriched 2.8-fold and leucine rich-repeats in Lleyn, enriched 2.7-fold (<xref ref-type="supplementary-material" rid="SM2">Supplementary Table 20</xref>).</p>
</sec>
<sec id="S3.SS2">
<title>Signatures of Selection Detected From Resequencing Data</title>
<p>Fifty-four (14 Welsh and 40 Russian sheep) resequenced genomes were aligned to the Oar_V.3.1 genome with a mean filtered coverage of 11.9&#x00D7; (<xref ref-type="supplementary-material" rid="SM2">Supplementary Table 1</xref>). A total of 41,643,098 SNPs were called, which were pruned to 38,276,494 SNPs after filtering. CNVRs covered 0.27% of the lowland and 0.24% of the upland genomes, overlapping 852 and 669 genes, respectively (<xref ref-type="supplementary-material" rid="SM2">Supplementary Tables 21</xref>,<xref ref-type="supplementary-material" rid="SM2">22</xref>). Three CNVRs from the lowland breeds and 52 CNVRs from the upland breeds overlapped the regions of selection. Some of these CNVRs had a high frequency in the population, including the regions under a strong selection on OAR24 in the lowland breeds, spanning the <italic>CLCN7</italic> gene and on OAR17, whereas in the upland breeds, these spanned the <italic>IGLV4-69, ZNF280B</italic>, and <italic>PRAME</italic> genes.</p>
<p>After excluding the regions overlapping CNVRs, DCMS found 2,996 regions under selection in the Welsh breeds (lowland = 514, upland = 2,482; <xref ref-type="supplementary-material" rid="SM2">Supplementary Tables 23</xref>,<xref ref-type="supplementary-material" rid="SM2">24</xref> and <xref ref-type="fig" rid="F3">Figure 3A</xref>). These regions overlapped 104 and 430 genes in the lowland and upland breeds, respectively. The most significantly selected region in the upland group was OAR22: 15.3676&#x2013;15.3679 Mb, which overlapped the <italic>NOC3L</italic> gene (<italic>q</italic> = 1.8 &#x00D7; 10<sup>&#x2013;8</sup>), and for the lowland group, it was a single synonymous SNP located in <italic>MYH11</italic> (<italic>q</italic> = 0.0006).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p><bold>(A)</bold> Manhattan plot of DCMS <italic>q</italic>-values of the lowland (yellow) and upland (blue) breeds showing missense mutations found under selection, highlighted in red with the corresponding gene names. Selection thresholds for a suggestive (<italic>q</italic> &#x003C; 0.05) and strong (<italic>q</italic> &#x003C; 0.01) selection shown by blue and red lines, respectively. Underlined gene names show selection in both the lowland and upland breeds. <bold>(B)</bold> Allele frequencies for missense mutations identified by a strong <italic>F</italic><sub><italic>ST</italic></sub> score represented by pie charts (green = reference allele, red = derived allele). This shows the location of missense mutations along their gene with nucleotide substitution highlighted by a red circle. Blue and yellow dotted lines point to the corresponding peak positions of the Manhattan plot. Amino acid substitution is shown, alongside the Polyphen score and <italic>q</italic>-value. <bold>(C)</bold> Haplostrip plots spanning genes containing the missense mutations but were selected on the basis of the H2/H1 and H12 haplotype statistics. Similar haplotypes are clustered together per population to demonstrate selection within these regions across the whole gene. These show the presence of reference (white) or derived (black) alleles making up different haplotypes. Populations of interest are highlighted in boxes corresponding to their colors on the Manhattan plot. &#x201C;&#x2756;&#x201D; is used to denote genes under selection by DCMS and HapFLK.</p></caption>
<graphic xlink:href="fgene-12-612492-g003.tif"/>
</fig>
</sec>
<sec id="S3.SS3">
<title>Identification of Candidate Genes and Missense Mutations</title>
<p>In regions under selection, there were 12 missense mutations found in the lowland breeds (<xref ref-type="supplementary-material" rid="SM2">Supplementary Table 25</xref>) and 85 missense mutations found in the upland breeds (<xref ref-type="supplementary-material" rid="SM2">Supplementary Table 26</xref>). Of these, only missense mutations and their enclosing genes, which were top-ranking SNPs in their selected intervals are discussed below, leading to a total of 4 in the lowland breeds and 14 in the upland breeds. Clarification of the type of selection relied on a strong support from the <italic>H2/H1</italic> and <italic>H12</italic> statistics, which were considered to be haplotype-based selection, or <italic>F</italic><sub><italic>ST</italic></sub>, which was considered fixation of a variant in a population and was seen as a selection acting on individual SNPs.</p>
<p>Three missense mutations were found in the regions under selection (<italic>q</italic> &#x003C; 0.01), with a strong support from the <italic>F</italic><sub><italic>ST</italic></sub> statistic (<italic>F</italic><sub><italic>ST</italic></sub> &#x2265; 0.3). In the lowland breeds, these included the reference alleles of OAR2:2,887,916 in the <italic>CDK5RAP2</italic> gene (<italic>q</italic> = 0.006; <italic>F</italic><sub><italic>ST</italic></sub> = 0.3) and OAR4:47,087,846 in <italic>CDHR3</italic> (<italic>q</italic> = 0.007; <italic>F</italic><sub><italic>S</italic></sub><sub><italic>T</italic></sub> = 0.3). For the upland breeds, only one missense mutation was found, relating to the derived allele of OAR8:21,197,663 in the <italic>RWDD1</italic> gene (<italic>q</italic> = 0.002; <italic>F</italic><sub><italic>ST</italic></sub> = 0.5). The Polyphen score of this selected mutation, L23P, was low and did not support the large change in the protein function (<xref ref-type="fig" rid="F3">Figure 3B</xref>).</p>
<p>Missense SNPs in the regions under selection supported by the haplotype statistics (<italic>H2/H1</italic>, <italic>H12</italic>) were only found in the <italic>MC1R</italic> gene in the lowland breeds, and in the upland breeds: <italic>FGD3</italic>, <italic>HSPA5</italic>, <italic>ABCA13</italic>, <italic>PTPN1</italic>, <italic>ACP2</italic>, <italic>LOC101121718</italic>, <italic>NOC3L</italic>, <italic>VASH1</italic>, <italic>SIRPA</italic>, and <italic>UBA52</italic> genes. Alternatively, some missense SNPs received strong support from Tajima&#x2019;s <italic>D</italic> and <italic>Pi</italic>, including one in the <italic>GIGYF1</italic> gene found in the selected regions in both the upland and lowland breeds, as well as the <italic>SLC22A7</italic> and <italic>HSD3B7</italic> genes in the upland breeds (<xref ref-type="fig" rid="F3">Figure 3C</xref>).</p>
<p>In the upland breeds, three of the genes found with missense SNPs were also identified in the regions under selection defined in the upland breeds of the genotyping analysis. These included: <italic>VASH1</italic> (<italic>q</italic> = 0.003) on OAR7, which also overlapped with BWM from the genotyping DCMS data; <italic>UBA52</italic> (<italic>q</italic> = 0.01) on OAR13, which also overlapped with BHC from the genotyping data, and <italic>SIRPA</italic> (<italic>q</italic> = 0.007). No missense mutations found in the lowland breeds overlapped with the regions under selection detected from the genotyping dataset.</p>
</sec>
<sec id="S3.SS4">
<title>Candidate Genes in Welsh Lowland Sheep Breeds</title>
<p><italic>MC1R</italic>, found in a region under selection in the lowland breeds (<xref ref-type="table" rid="T3">Table 3</xref>), is known to cause an upregulation of tyrosinase in hair melanocytes, which led to an increase of black eumelanin pigment; however, in sheep, typically, white pheomelanin is produced due to selection for mutations in <italic>MC1R</italic> (<xref ref-type="bibr" rid="B71">Weatherhead and Logan, 1981</xref>; <xref ref-type="bibr" rid="B76">Yang et al., 2013</xref>). Another gene, <italic>CDK5RAP2</italic>, with a strong support from allele frequency statistics, is related to human neurodevelopment by recruiting tubulin subunits, which are important for cortical gyration (<xref ref-type="bibr" rid="B33">Issa et al., 2013</xref>). Mutations in this gene have also been linked to Hertwig&#x2019;s anemia mutant mouse models displaying blood cytopenia, aneuploidy due to impaired cell-cycle spindle checkpoints, and increased neuronal cell death (<xref ref-type="bibr" rid="B47">Lizarraga et al., 2010</xref>). Finally, <italic>CDHR3</italic>, encoding a cell adhesion protein is linked to childhood asthma and rhinovirus-C susceptibility, was also located in a region under selection in Asian sheep by HapFLK (<xref ref-type="bibr" rid="B23">Fariello et al., 2014</xref>; <xref ref-type="bibr" rid="B9">Bochkov et al., 2015</xref>).</p>
<table-wrap position="float" id="T3">
<label>TABLE 3</label>
<caption><p>Candidate genes and missense mutations in the lowland and upland sheep breeds.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">OAR</td>
<td valign="top" align="left">Region start</td>
<td valign="top" align="left">Region end</td>
<td valign="top" align="center">SNP</td>
<td valign="top" align="center">Breed</td>
<td valign="top" align="left">Gene (rank)</td>
<td valign="top" align="center">Reference allele</td>
<td valign="top" align="center">Alternative allele</td>
<td valign="top" align="center">Mutation</td>
<td valign="top" align="center">PolyPhen</td>
<td valign="top" align="left"><italic>q</italic>-value</td>
<td valign="top" align="left">Function</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">2,887,916</td>
<td valign="top" align="left">2,887,916</td>
<td valign="top" align="center">2,887,916</td>
<td valign="top" align="center">Lowland</td>
<td valign="top" align="left"><italic>CDK5RAP2</italic>(1)</td>
<td valign="top" align="center">A&#x002A;</td>
<td valign="top" align="center">G</td>
<td valign="top" align="center">M47V</td>
<td valign="top" align="center">0</td>
<td valign="top" align="left">0.006</td>
<td valign="top" align="left">Cell cycle</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">28,318,917</td>
<td valign="top" align="left">28,318,992</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>FGD3</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.003</td>
<td valign="top" align="left">GTP binding</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">10,725,499</td>
<td valign="top" align="left">10,725,501</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>HSPA5</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.007</td>
<td valign="top" align="left">Cell stress</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">7,476,204</td>
<td valign="top" align="left">7,476,211</td>
<td valign="top" align="center">7,476,211</td>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>ABCA13</italic>(1)</td>
<td valign="top" align="center">T&#x002A;</td>
<td valign="top" align="center">C</td>
<td valign="top" align="center">K2619Q</td>
<td valign="top" align="center">0.9</td>
<td valign="top" align="left">0.006</td>
<td valign="top" align="left">Membrane transport</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">47,088,764</td>
<td valign="top" align="left">47,089,276</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Lowland</td>
<td valign="top" align="left"><italic>CDHR3</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.004</td>
<td valign="top" align="left">Cell adhesion</td>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td valign="top" align="left">84,989,884</td>
<td valign="top" align="left">84,989,669</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>VASH1</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.004</td>
<td valign="top" align="left">Angiogenesis</td>
</tr>
<tr>
<td valign="top" align="left">8</td>
<td valign="top" align="left">21,197,663</td>
<td valign="top" align="left">21,198,137</td>
<td valign="top" align="center">21,197,663</td>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>RWDD1</italic>(1)</td>
<td valign="top" align="center">A</td>
<td valign="top" align="center">G&#x002A;</td>
<td valign="top" align="center">L23P</td>
<td valign="top" align="center">0.04</td>
<td valign="top" align="left">0.002</td>
<td valign="top" align="left">Anti-oxidation</td>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="left">49,771,782</td>
<td valign="top" align="left">49,771,855</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>UBA52</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.1</td>
<td valign="top" align="left">Ubiquitinoylation</td>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="left">52,848,831</td>
<td valign="top" align="left">52,848,943</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>SIRPA</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.006</td>
<td valign="top" align="left">Cell recognition</td>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="left">52,848,831</td>
<td valign="top" align="left">52,848,943</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>PTPN1</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.1</td>
<td valign="top" align="left">Insulin pathway</td>
</tr>
<tr>
<td valign="top" align="left">14</td>
<td valign="top" align="left">14,231,667</td>
<td valign="top" align="left">14,232,187</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Lowland</td>
<td valign="top" align="left"><italic>MC1R</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.004</td>
<td valign="top" align="left">Coat color</td>
</tr>
<tr>
<td valign="top" align="left">15</td>
<td valign="top" align="left">75,351,718</td>
<td valign="top" align="left">75,352,196</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>ACP2</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.006</td>
<td valign="top" align="left">Development</td>
</tr>
<tr>
<td valign="top" align="left">20</td>
<td valign="top" align="left">10,644,119</td>
<td valign="top" align="left">10,644,602</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left" colspan="2"><italic>LOC10110726</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center">0.009</td>
<td valign="top" align="left">Fat deposition</td>
</tr>
<tr>
<td valign="top" align="left">20</td>
<td valign="top" align="left">16,972,103</td>
<td valign="top" align="left">16,972,103</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>SLC22A7</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.009</td>
<td valign="top" align="left">Cyclic nucleotide transport</td>
</tr>
<tr>
<td valign="top" align="left">22</td>
<td valign="top" align="left">15,368,530</td>
<td valign="top" align="left">15,368,926</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>NOC3L</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">2.0 &#x00D7; 10<sup>&#x2013;8</sup></td>
<td valign="top" align="left">Cell cycle</td>
</tr>
<tr>
<td valign="top" align="left">24</td>
<td valign="top" align="left">27,106,763</td>
<td valign="top" align="left">27,106,886</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Upland</td>
<td valign="top" align="left"><italic>HSD3B7</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.002</td>
<td valign="top" align="left">Bile synthesis</td>
</tr>
<tr>
<td valign="top" align="left">24</td>
<td valign="top" align="left">35,794,428</td>
<td valign="top" align="left">35,794,428</td>
<td valign="top" align="center"/>
<td valign="top" align="center">Lowland/Upland</td>
<td valign="top" align="left"><italic>GIGFY</italic>(1)</td>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="center"/>
<td valign="top" align="left">0.007</td>
<td valign="top" align="left">Insulin pathway</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<attrib><italic>&#x002A;Denotes selected allele.</italic></attrib>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="S3.SS5">
<title>Candidate Genes in Welsh Upland Sheep Breeds</title>
<p>Within the upland breeds, many genes found in the selected regions had functions related to cell stress and metabolism (<xref ref-type="table" rid="T3">Table 3</xref>). The most highly supported by DCMS, <italic>RWDD1</italic>, encodes a transcription factor related to sulfide metabolism in metozoans (<xref ref-type="bibr" rid="B34">Kang et al., 2008</xref>; <xref ref-type="bibr" rid="B45">Li et al., 2018</xref>). <italic>HSPA5</italic> also responds to cell stress mechanisms by promoting protein refolding in the endoplasmic reticulum in cancers or virally-infected cells (<xref ref-type="bibr" rid="B11">Booth et al., 2015</xref>). This gene has also been found under selection in Chinese Yellow-Feathered chickens with regard to meat quality (<xref ref-type="bibr" rid="B32">Huang et al., 2020</xref>) and muscling in world pig breeds (<xref ref-type="bibr" rid="B44">Li et al., 2011</xref>).</p>
<p>Of the three genes found in the selected regions in both the genotyping and resequencing datasets, two related to cell stress mechanisms. The most significant region contains <italic>VASH1</italic>, encoding the vasohibin 1 signaling molecule, with known roles of negatively regulating angiogenesis (<xref ref-type="bibr" rid="B15">Chen et al., 2020</xref>), as well as promoting expression of antioxidation enzymes (<xref ref-type="bibr" rid="B51">Miyashita et al., 2012</xref>). Age-related downregulation of <italic>VASH1</italic> leads to a lower endothelial cell stress tolerance, posing as a risk factor for human vascular diseases in later life (<xref ref-type="bibr" rid="B67">Takeda et al., 2016</xref>). Secondly, <italic>UBA52</italic> encodes a protein with an ubiquitinate activity, with its downregulation causing cell cycle arrest and reduced protein synthesis essential for pre-implantation embryogenesis success in mouse models (<xref ref-type="bibr" rid="B39">Kobayashi et al., 2016</xref>).</p>
<p>Several genes related to metabolism and growth were found under selection in the upland breeds. The most significant of these, <italic>HSD3B7</italic>, is part of the <italic>bile biosynthesis</italic> pathway (<xref ref-type="bibr" rid="B16">Cheng et al., 2003</xref>). <italic>PTPN1</italic> is a risk-factor gene linked to diabetes and obesity (<xref ref-type="bibr" rid="B54">Olivier et al., 2004</xref>), which has a direct involvement in the <italic>insulin</italic> and <italic>leptin signaling pathways</italic>, and that mice lacking this gene were resistant to weight gain and intolerant to glucose (<xref ref-type="bibr" rid="B21">Elchebly et al., 1999</xref>). <italic>GIGYF1</italic> also has roles in enhancing the insulin receptor pathway, but additionally has been linked to translational repression (<xref ref-type="bibr" rid="B26">Giovannone et al., 2003</xref>; <xref ref-type="bibr" rid="B68">Tollenaere et al., 2019</xref>). Similar effects have been seen with <italic>APC2</italic>, which is linked to muscle mass in mice (<xref ref-type="bibr" rid="B35">K&#x00E4;rst et al., 2011</xref>). The Rho-GEF-containing gene <italic>FGD3</italic>, expressed in the growth plate of long bones, was previously found under selection in French Trotter and Gidran horses, as well as in Jutland and Japanese black cattle in association to birth weight (<xref ref-type="bibr" rid="B66">Takasuga et al., 2015</xref>; <xref ref-type="bibr" rid="B28">Grilz-Seger et al., 2019</xref>; <xref ref-type="bibr" rid="B63">Stronen et al., 2019</xref>).</p>
<p>Two membrane transport proteins, ABCA13 and SLC22A7, were found to be in the regions under selection in the upland breeds. <italic>ABCA13</italic> encodes a member of the ATP-binding cassette membrane transporter family, responsible for the active transport of biological substrates across cell membranes (<xref ref-type="bibr" rid="B57">Prades et al., 2002</xref>). Secondly, <italic>SLC22A7</italic>, a transmembrane solute carrier, with roles in cAMP and cGMP transport in mammalian tissues and, therefore, is important for intracellular signaling which may mobilize intracellular Ca<sup>2+</sup>, activate protein kinases, or activate transcription factors (<xref ref-type="bibr" rid="B40">Kobayashi et al., 2005</xref>; <xref ref-type="bibr" rid="B75">Yan et al., 2016</xref>). The final gene shared between the genotyping and resequencing data was <italic>SIRPA</italic>, which is expressed by macrophages and polarizes M1 phagocytic macrophages to M2 antiphagocytic macrophages, which is a key survival strategy for tumors (<xref ref-type="bibr" rid="B4">Barclay and van den Berg, 2014</xref>).</p>
</sec>
<sec id="S3.SS6">
<title>Gene Ontology Enrichments Show Adaptations to Environment in the Resequenced Lowland and Upland Breeds</title>
<p>Nine functional category enrichments were found from genes within CNVRs in the lowland breeds and 14 enrichments in the upland breeds (<xref ref-type="supplementary-material" rid="SM2">Supplementary Tables 27</xref>,<xref ref-type="supplementary-material" rid="SM2">28</xref>). Some of these enrichments were shared between the lowland and upland breeds. These were semaphorins; ion transport, pleckstrin homology domain; SAND domains; and EGF-like domains. Exclusive enrichments in the lowland breeds&#x2019; CNVRs included cell surface receptors, neuromuscular process, and DNA binding whereas exclusive enrichments in the upland breeds included Src homology-3 domain Rho signal transduction, Notch signaling, and chondrocyte differentiation (1.4-fold). Genes within the regions under selection in the upland breeds showed significantly enriched clusters including interleukin-1 and ATP-binding (<xref ref-type="supplementary-material" rid="SM2">Supplementary Table 29</xref>). No functional category enrichments were found in genes in the regions under selection in the lowland breeds.</p>
</sec>
</sec>
<sec id="S4">
<title>Discussion</title>
<p>Our study has demonstrated that regions under putative selection in Welsh sheep genomes contain candidate genes for adaptation to their local environment and production of socioeconomic traits. We used a large set of animals genotyped on a relatively small number of SNPs, applying the haplotype and point-based selection scan algorithms. This was combined with a relatively small number of resequenced individuals subjected to point-based selection scan. As a result, we detected genomic regions under selection in individual and groups of breeds, including candidate missense variants within these regions. Regions under selection detected by the three approaches followed the expected patterns seen previously that the haplotype-based approach would detect larger but fewer regions than the point-based approach, which detected smaller, but more numerous regions under selection (<xref ref-type="bibr" rid="B79">Yurchenko et al., 2019</xref>).</p>
<p>Exposure to altitudes has a range of deleterious effects caused by hypoxia, exposure to ultraviolet radiation, and generation of oxygen radicals. These, in turn, have been linked to a negative energy balance, dysregulated proteostasis, cellular stress mechanisms, and DNA damage (<xref ref-type="bibr" rid="B3">Askew, 2002</xref>; <xref ref-type="bibr" rid="B55">Pasiakos et al., 2017</xref>). Therefore, the presence of genes related to cell-stress and anti-oxidation in the regions under selection gives reassurance that the results from this study are relevant to the adaptations of Welsh sheep to altitudes. Genes related to hypoxia, however, were not identified in the regions under selection in the upland breeds, so it can be assumed that it is not a stress factor for these breeds because the altitudes they are farmed at are only moderate. Furthermore, body conditioning genes, such as <italic>FDG3</italic> and <italic>ACP2</italic>, in the upland breeds also suggest physical mechanisms of adaptation, such as increased fat deposition and muscle mass, however, these could also be linked to socioeconomic performance (<xref ref-type="bibr" rid="B26">Giovannone et al., 2003</xref>; <xref ref-type="bibr" rid="B7">Bento et al., 2004</xref>; <xref ref-type="bibr" rid="B29">Gu et al., 2011</xref>; <xref ref-type="bibr" rid="B35">K&#x00E4;rst et al., 2011</xref>; <xref ref-type="bibr" rid="B28">Grilz-Seger et al., 2019</xref>).</p>
<p>We observed selection at the loci of other top-ranking candidates from the haplotype analysis with known roles in energy consumption, liver metabolism, milking, fat deposition, and angiogenesis (<xref ref-type="bibr" rid="B77">Yang et al., 2016</xref>; <xref ref-type="bibr" rid="B2">Armstrong et al., 2018</xref>; <xref ref-type="bibr" rid="B58">Pszczola et al., 2018</xref>). These findings, showing the top-ranking genes sharing functions of that in the resequencing study, provide many candidate genes relating to survivability and socioeconomic traits in Welsh upland sheep. Further evidence of selection in these breeds can be seen from functional term enrichments in genes found in the selected regions and in CNVRs.</p>
<p>Lowland breeds showed less signatures of selection, however, they mainly had selection in regions containing genes known to be associated with domestication, which are commonly reported signatures of selection in world sheep breeds (<xref ref-type="bibr" rid="B36">Kijas et al., 2012</xref>; <xref ref-type="bibr" rid="B72">Wei et al., 2015</xref>; <xref ref-type="bibr" rid="B70">Wang et al., 2019</xref>; <xref ref-type="bibr" rid="B46">Li et al., 2020</xref>). By demonstrating the lowland breeds sharing the signatures of selection with other productive breeds, this indicates that they are better suited for productive qualities but do not show an adaptation for the Welsh uplands. Despite this, selection for <italic>CDK5RAP2</italic> seen in the lowland breeds of the resequencing study may be linked to upland adaptation as mice models with truncating mutations have lower red blood cell counts, however, this is true for white blood cells too, and so, may be linked to immunity traits as well as neurodevelopment (<xref ref-type="bibr" rid="B5">Barker and Bernstein, 1983</xref>).</p>
<p>Differences in the results when using the genotyping and resequencing data were expected and can be attested to an increased density of SNPs in the resequencing data and a different composition of populations used for each study. The former effect would be expected to lead to narrower regions being detected under selection in the resequencing dataset, which could shift the most significant SNP away from candidate genes detected from the genotyping data. Secondly, using groups of multiple breeds could mean that whilst haplotypes often remain similar amongst closely related breeds, certain point mutations that differentiate those breeds from each other may become diluted in frequency, and so, would not be considered under selection by this method when a small number of animals is used. This is likely the case where, lowland breeds show less signatures of selection than upland breeds, suggesting that they share less signatures when grouped. This postulates that Welsh lowland breeds are more diverse than the upland breeds, supported by data from <xref ref-type="bibr" rid="B8">Beynon et al. (2015)</xref>, which could be in response to the demand for socioeconomic traits and lack of selection pressures in comparison to the upland breeds, where there seem to be a selective pressure on the same region, leading to shared signatures of selection. This further suggests that the lowland breeds have been selected for the production of socioeconomic traits, rather than adaptation to their local environment.</p>
<p>Lower costs of genome resequencing have allowed a deeper insight to the individual mutations that could have functional roles within a region under selection; however, this is not always a realistic approach when investigating many related breeds in a single study. Our method here has demonstrated reliability in using resequencing data from a small number of individuals of different breeds but applied to similar environments can be supported by genotyping many individuals of these breeds. This is truer with the upland Welsh breeds, which is most likely due to the higher environmental selective pressures applied when compared to the lowland breeds. This has greatly eluted candidate genes relating to hardiness and survivability in both the genotyping and resequencing data.</p>
</sec>
<sec id="S5">
<title>Conclusion</title>
<p>Here, we have seen the first investigation into signatures of selection in Welsh sheep breeds using a large number of genotyped individuals and a small number of whole-genome resequenced individuals. Statistical pipelines have shown selection in Welsh upland breeds in regions containing genes relating to adaptation to the local environment, including candidate genetic variants, as well as some genes related to the production of socioeconomic traits in the lowland breeds. In turn, this information is useful, not only for the conservation of these culturally important breeds, but also for the improved production capabilities of mountain breeds and adaptation of productive breeds through a marker-assisted selection.</p>
</sec>
<sec id="S6">
<title>Data Availability Statement</title>
<p>The original contributions presented in the study are publicly available in NCBI using accession number <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA646642">PRJNA646642</ext-link>.</p>
</sec>
<sec id="S7">
<title>Author Contributions</title>
<p>DL: leading the project, sample collection, and writing the manuscript. JS-J: running the analyses and drafting the manuscript. VL: genome sequencing of Welsh sheep samples and initial analysis. AY: analysis pipeline development. NY: sample collection and manuscript editing. MS: Welsh sheep sequencing and initial analysis. All authors edited the manuscript.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> The collection and sequencing of Russian sheep samples used in this study were funded by the Russian Scientific Foundation grant 19-76-20026 to DL. Resources from HPC Wales and Supercomputing Wales supported the contributions of VL and MS.</p>
</fn>
</fn-group>
<sec id="S9" sec-type="supplementary material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2021.612492/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2021.612492/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_2.xlsx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Adzhubei</surname> <given-names>I.</given-names></name> <name><surname>Jordan</surname> <given-names>D. M.</given-names></name> <name><surname>Sunyaev</surname> <given-names>S. R.</given-names></name></person-group> (<year>2013</year>). <article-title>Predicting functional effect of human missense mutations using PolyPhen-2.</article-title> <source><italic>Curr. Protoc. Hum. Genet.</italic></source> <volume>Chapter 7</volume>:<issue>Unit7.20</issue>. <pub-id pub-id-type="doi">10.1002/0471142905.hg0720s76</pub-id> <pub-id pub-id-type="pmid">23315928</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Armstrong</surname> <given-names>E.</given-names></name> <name><surname>Ciappesoni</surname> <given-names>G.</given-names></name> <name><surname>Iriarte</surname> <given-names>W.</given-names></name> <name><surname>Da Silva</surname> <given-names>C.</given-names></name> <name><surname>Macedo</surname> <given-names>F.</given-names></name> <name><surname>Navajas</surname> <given-names>E. A.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Novel genetic polymorphisms associated with carcass traits in grazing Texel sheep.</article-title> <source><italic>Meat Sci.</italic></source> <volume>145</volume> <fpage>202</fpage>&#x2013;<lpage>208</lpage>. <pub-id pub-id-type="doi">10.1016/j.meatsci.2018.06.014</pub-id> <pub-id pub-id-type="pmid">29982074</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Askew</surname> <given-names>E. W.</given-names></name></person-group> (<year>2002</year>). <article-title>Work at high altitude and oxidative stress: antioxidant nutrients.</article-title> <source><italic>Toxicology</italic></source> <volume>180</volume> <fpage>107</fpage>&#x2013;<lpage>119</lpage>. <pub-id pub-id-type="doi">10.1016/S0300-483X(02)00385-2</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barclay</surname> <given-names>A. N.</given-names></name> <name><surname>van den Berg</surname> <given-names>T. K.</given-names></name></person-group> (<year>2014</year>). <article-title>The interaction between signal regulatory protein alpha (SIRP&#x03B1;) and CD47: structure, function, and therapeutic target.</article-title> <source><italic>Annu. Rev. Immunol.</italic></source> <volume>32</volume> <fpage>25</fpage>&#x2013;<lpage>50</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-immunol-032713-120142</pub-id> <pub-id pub-id-type="pmid">24215318</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barker</surname> <given-names>J.</given-names></name> <name><surname>Bernstein</surname> <given-names>S.</given-names></name></person-group> (<year>1983</year>). <article-title>Hertwig&#x2019;s anemia: characterization of the stem cell defect.</article-title> <source><italic>Blood</italic></source> <volume>61</volume> <fpage>765</fpage>&#x2013;<lpage>769</lpage>. <pub-id pub-id-type="doi">10.1182/blood.v61.4.765.bloodjournal614765</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Benavides</surname> <given-names>M. V.</given-names></name> <name><surname>Sonstegard</surname> <given-names>T. S.</given-names></name> <name><surname>Kemp</surname> <given-names>S.</given-names></name> <name><surname>Mugambi</surname> <given-names>J. M.</given-names></name> <name><surname>Gibson</surname> <given-names>J. P.</given-names></name> <name><surname>Baker</surname> <given-names>R. L.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Identification of novel loci associated with gastrointestinal parasite resistance in a Red Maasai x Dorper backcross population.</article-title> <source><italic>PLoS One</italic></source> <volume>10</volume>:<issue>e0122797</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0122797</pub-id> <pub-id pub-id-type="pmid">25867089</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bento</surname> <given-names>J. L.</given-names></name> <name><surname>Palmer</surname> <given-names>N. D.</given-names></name> <name><surname>Mychaleckyj</surname> <given-names>J. C.</given-names></name> <name><surname>Lange</surname> <given-names>L. A.</given-names></name> <name><surname>Langefeld</surname> <given-names>C. D.</given-names></name> <name><surname>Rich</surname> <given-names>S. S.</given-names></name><etal/></person-group> (<year>2004</year>). <article-title>Association of protein tyrosine phosphatase 1B gene polymorphisms with type 2 diabetes.</article-title> <source><italic>Diabetes</italic></source> <volume>53</volume>:<issue>3007</issue>. <pub-id pub-id-type="doi">10.2337/diabetes.53.11.3007</pub-id> <pub-id pub-id-type="pmid">15504984</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beynon</surname> <given-names>S. E.</given-names></name> <name><surname>Slavov</surname> <given-names>G. T.</given-names></name> <name><surname>Farr&#x00E9;</surname> <given-names>M.</given-names></name> <name><surname>Sunduimijid</surname> <given-names>B.</given-names></name> <name><surname>Waddams</surname> <given-names>K.</given-names></name> <name><surname>Davies</surname> <given-names>B.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Population structure and history of the Welsh sheep breeds determined by whole genome genotyping.</article-title> <source><italic>BMC Genet.</italic></source> <volume>16</volume>:<issue>65</issue>. <pub-id pub-id-type="doi">10.1186/s12863-015-0216-x</pub-id> <pub-id pub-id-type="pmid">26091804</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bochkov</surname> <given-names>Y. A.</given-names></name> <name><surname>Watters</surname> <given-names>K.</given-names></name> <name><surname>Ashraf</surname> <given-names>S.</given-names></name> <name><surname>Griggs</surname> <given-names>T. F.</given-names></name> <name><surname>Devries</surname> <given-names>M. K.</given-names></name> <name><surname>Jackson</surname> <given-names>D. J.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Cadherin-related family member 3, a childhood asthma susceptibility gene product, mediates rhinovirus C binding and replication.</article-title> <source><italic>Proc. Natl. Acad. Sci. U S A.</italic></source> <volume>112</volume>, <fpage>5485</fpage>&#x2013;<lpage>5490</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1421178112</pub-id> <pub-id pub-id-type="pmid">25848009</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bonhomme</surname> <given-names>M.</given-names></name> <name><surname>Chevalet</surname> <given-names>C.</given-names></name> <name><surname>Servin</surname> <given-names>B.</given-names></name> <name><surname>Boitard</surname> <given-names>S.</given-names></name> <name><surname>Abdallah</surname> <given-names>J.</given-names></name> <name><surname>Blott</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Detecting selection in population trees: the Lewontin and Krakauer test extended.</article-title> <source><italic>Genetics</italic></source> <volume>186</volume> <fpage>241</fpage>&#x2013;<lpage>262</lpage>. <pub-id pub-id-type="doi">10.1534/genetics.104.117275</pub-id> <pub-id pub-id-type="pmid">20855576</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Booth</surname> <given-names>L.</given-names></name> <name><surname>Roberts</surname> <given-names>J. L.</given-names></name> <name><surname>Dent</surname> <given-names>P.</given-names></name></person-group> (<year>2015</year>). <article-title>HSPA5/Dna K may be a useful target for human disease therapies.</article-title> <source><italic>DNA Cell Biol.</italic></source> <volume>34</volume> <fpage>153</fpage>&#x2013;<lpage>158</lpage>. <pub-id pub-id-type="doi">10.1089/dna.2015.2808</pub-id> <pub-id pub-id-type="pmid">25689303</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bovo</surname> <given-names>S.</given-names></name> <name><surname>Mazzoni</surname> <given-names>G.</given-names></name> <name><surname>Bertolini</surname> <given-names>F.</given-names></name> <name><surname>Schiavo</surname> <given-names>G.</given-names></name> <name><surname>Galimberti</surname> <given-names>G.</given-names></name> <name><surname>Gallo</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Genome-wide association studies for 30 haematological and blood clinical-biochemical traits in Large White pigs reveal genomic regions affecting intermediate phenotypes.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>9</volume>:<issue>7003</issue>. <pub-id pub-id-type="doi">10.1038/s41598-019-43297-1</pub-id> <pub-id pub-id-type="pmid">31065004</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bowles</surname> <given-names>D.</given-names></name></person-group> (<year>2015</year>). <article-title>Recent advances in understanding the genetic resources of sheep breeds locally adapted to the UK uplands: opportunities they offer for sustainable productivity.</article-title> <source><italic>Front. Genet.</italic></source> <volume>6</volume>. <pub-id pub-id-type="doi">10.3389/fgene.2015.00024</pub-id> <pub-id pub-id-type="pmid">25729388</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bowles</surname> <given-names>D.</given-names></name> <name><surname>Carson</surname> <given-names>A.</given-names></name> <name><surname>Isaac</surname> <given-names>P.</given-names></name></person-group> (<year>2014</year>). <article-title>Genetic distinctiveness of the Herdwick sheep breed and two other locally adapted hill breeds of the UK.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e87823</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0087823</pub-id> <pub-id pub-id-type="pmid">24489968</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>C. Y.</given-names></name> <name><surname>Salomon</surname> <given-names>A. K.</given-names></name> <name><surname>Caporizzo</surname> <given-names>M. A.</given-names></name> <name><surname>Curry</surname> <given-names>S.</given-names></name> <name><surname>Kelly</surname> <given-names>N. A.</given-names></name> <name><surname>Bedi</surname> <given-names>K. C.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Depletion of vasohibin 1 speeds contraction and relaxation in failing human cardiomyocytes.</article-title> <source><italic>Circ. Res.</italic></source> <volume>127</volume> <fpage>e14</fpage>&#x2013;<lpage>e27</lpage>. <pub-id pub-id-type="doi">10.1161/CIRCRESAHA.119.315947</pub-id> <pub-id pub-id-type="pmid">32272864</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cheng</surname> <given-names>J. B.</given-names></name> <name><surname>Jacquemin</surname> <given-names>E.</given-names></name> <name><surname>Gerhardt</surname> <given-names>M.</given-names></name> <name><surname>Nazer</surname> <given-names>H.</given-names></name> <name><surname>Cresteil</surname> <given-names>D.</given-names></name> <name><surname>Heubi</surname> <given-names>J. E.</given-names></name><etal/></person-group> (<year>2003</year>). <article-title>Molecular genetics of 3&#x03B2;-hydroxy-&#x03B4;5-c27-steroid oxidoreductase deficiency in 16 patients with loss of bile acid synthesis and liver disease.</article-title> <source><italic>J. Clin. Endocrinol. Metab.</italic></source> <volume>88</volume> <fpage>1833</fpage>&#x2013;<lpage>1841</lpage>. <pub-id pub-id-type="doi">10.1210/jc.2002-021580</pub-id> <pub-id pub-id-type="pmid">12679481</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Danecek</surname> <given-names>P.</given-names></name> <name><surname>Auton</surname> <given-names>A.</given-names></name> <name><surname>Abecasis</surname> <given-names>G.</given-names></name> <name><surname>Albers</surname> <given-names>C. A.</given-names></name> <name><surname>Banks</surname> <given-names>E.</given-names></name> <name><surname>DePristo</surname> <given-names>M. A.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>The variant call format and VCFtools.</article-title> <source><italic>Bioinformatics</italic></source> <volume>27</volume>, <fpage>2156</fpage>&#x2013;<lpage>2158</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr330</pub-id> <pub-id pub-id-type="pmid">21653522</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Davies</surname> <given-names>E.</given-names></name></person-group> (<year>1935</year>). <article-title>Sheep farming in Upland Wales.</article-title> <source><italic>Geography</italic></source> <volume>20</volume> <fpage>97</fpage>&#x2013;<lpage>111</lpage>.</citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dekker</surname> <given-names>N.</given-names></name> <name><surname>Voorn-Brouwer</surname> <given-names>T.</given-names></name> <name><surname>Verhoek</surname> <given-names>M.</given-names></name> <name><surname>Wennekes</surname> <given-names>T.</given-names></name> <name><surname>Narayan</surname> <given-names>R. S.</given-names></name> <name><surname>Speijer</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>The cytosolic &#x03B2;-glucosidase GBA3 does not influence type 1 Gaucher disease manifestation.</article-title> <source><italic>Blood Cells Mol. Dis.</italic></source> <volume>46</volume> <fpage>19</fpage>&#x2013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.1016/j.bcmd.2010.07.009</pub-id> <pub-id pub-id-type="pmid">20728381</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Delaneau</surname> <given-names>O.</given-names></name> <name><surname>Marchini</surname> <given-names>J.</given-names></name> <name><surname>Zagury</surname> <given-names>J.-F.</given-names></name></person-group> (<year>2011</year>). <article-title>A linear complexity phasing method for thousands of genomes.</article-title> <source><italic>Nat. Methods</italic></source> <volume>9</volume> <fpage>179</fpage>&#x2013;<lpage>181</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.1785</pub-id> <pub-id pub-id-type="pmid">22138821</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Elchebly</surname> <given-names>M.</given-names></name> <name><surname>Payette</surname> <given-names>P.</given-names></name> <name><surname>Michaliszyn</surname> <given-names>E.</given-names></name> <name><surname>Cromlish</surname> <given-names>W.</given-names></name> <name><surname>Collins</surname> <given-names>S.</given-names></name> <name><surname>Loy</surname> <given-names>A. L.</given-names></name><etal/></person-group> (<year>1999</year>). <article-title>Increased insulin sensitivity and obesity resistance in mice lacking the protein tyrosine phosphatase-1B gene.</article-title> <source><italic>Science</italic></source> <volume>283</volume>:<issue>1544</issue>. <pub-id pub-id-type="doi">10.1126/science.283.5407.1544</pub-id> <pub-id pub-id-type="pmid">10066179</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fariello</surname> <given-names>M. I.</given-names></name> <name><surname>Boitard</surname> <given-names>S.</given-names></name> <name><surname>Naya</surname> <given-names>H.</given-names></name> <name><surname>SanCristobal</surname> <given-names>M.</given-names></name> <name><surname>Servin</surname> <given-names>B.</given-names></name></person-group> (<year>2013</year>). <article-title>Detecting signatures of selection through haplotype differentiation among hierarchically structured populations.</article-title> <source><italic>Genetics</italic></source> <volume>193</volume> <fpage>929</fpage>&#x2013;<lpage>941</lpage>. <pub-id pub-id-type="doi">10.1534/genetics.112.147231</pub-id> <pub-id pub-id-type="pmid">23307896</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fariello</surname> <given-names>M.-I.</given-names></name> <name><surname>Servin</surname> <given-names>B.</given-names></name> <name><surname>Tosser-Klopp</surname> <given-names>G.</given-names></name> <name><surname>Rupp</surname> <given-names>R.</given-names></name> <name><surname>Moreno</surname> <given-names>C.</given-names></name> <name><surname>Consortium</surname> <given-names>I. S. G.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Selection signatures in worldwide sheep populations.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e103813</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0103813</pub-id> <pub-id pub-id-type="pmid">25126940</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fernandez-Marcos</surname> <given-names>P. J.</given-names></name> <name><surname>Auwerx</surname> <given-names>J.</given-names></name></person-group> (<year>2011</year>). <article-title>Regulation of PGC-1&#x03B1;, a nodal regulator of mitochondrial biogenesis.</article-title> <source><italic>Am. J. Clin. Nutr.</italic></source> <volume>93</volume> <fpage>884S</fpage>&#x2013;<lpage>890S</lpage>. <pub-id pub-id-type="doi">10.3945/ajcn.110.001917</pub-id> <pub-id pub-id-type="pmid">21289221</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Garud</surname> <given-names>N. R.</given-names></name> <name><surname>Messer</surname> <given-names>P. W.</given-names></name> <name><surname>Buzbas</surname> <given-names>E. O.</given-names></name> <name><surname>Petrov</surname> <given-names>D. A.</given-names></name></person-group> (<year>2015</year>). <article-title>Recent selective sweeps in north american <italic>Drosophila</italic> melanogaster show signatures of soft sweeps.</article-title> <source><italic>PLoS Genet.</italic></source> <volume>11</volume>:<issue>e1005004</issue>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1005004</pub-id> <pub-id pub-id-type="pmid">25706129</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Giovannone</surname> <given-names>B.</given-names></name> <name><surname>Lee</surname> <given-names>E.</given-names></name> <name><surname>Laviola</surname> <given-names>L.</given-names></name> <name><surname>Giorgino</surname> <given-names>F.</given-names></name> <name><surname>Cleveland</surname> <given-names>K. A.</given-names></name> <name><surname>Smith</surname> <given-names>R. J.</given-names></name></person-group> (<year>2003</year>). <article-title>Two novel proteins that are linked to insulin-like growth factor (IGF-I) receptors by the Grb10 adapter and modulate IGF-I signalling.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>278</volume> <fpage>31564</fpage>&#x2013;<lpage>31573</lpage>. <pub-id pub-id-type="doi">10.1074/JBC.M211572200</pub-id> <pub-id pub-id-type="pmid">12771153</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grant</surname> <given-names>J. R.</given-names></name> <name><surname>Arantes</surname> <given-names>A. S.</given-names></name> <name><surname>Liao</surname> <given-names>X.</given-names></name> <name><surname>Stothard</surname> <given-names>P.</given-names></name></person-group> (<year>2011</year>). <article-title>In-depth annotation of SNPs arising from resequencing projects using NGS-SNP.</article-title> <source><italic>Bioinformatics</italic></source> <volume>27</volume> <fpage>2300</fpage>&#x2013;<lpage>2301</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr372</pub-id> <pub-id pub-id-type="pmid">21697123</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grilz-Seger</surname> <given-names>G.</given-names></name> <name><surname>Neuditschko</surname> <given-names>M.</given-names></name> <name><surname>Ricard</surname> <given-names>A.</given-names></name> <name><surname>Velie</surname> <given-names>B.</given-names></name> <name><surname>Lindgren</surname> <given-names>G.</given-names></name> <name><surname>Mesari&#x010D;</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Genome-wide homozygosity patterns and evidence for selection in a set of European and Near Eastern horse breeds.</article-title> <source><italic>Genes (Basel)</italic></source> <volume>10</volume>:<issue>491</issue>. <pub-id pub-id-type="doi">10.3390/genes10070491</pub-id> <pub-id pub-id-type="pmid">31261764</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gu</surname> <given-names>X.</given-names></name> <name><surname>Feng</surname> <given-names>C.</given-names></name> <name><surname>Ma</surname> <given-names>L.</given-names></name> <name><surname>Song</surname> <given-names>C.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Da</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Genome-wide association study of body weight in chicken F2 resource population.</article-title> <source><italic>PLoS One</italic></source> <volume>6</volume>:<issue>e21872</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0021872</pub-id> <pub-id pub-id-type="pmid">21779344</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Heaton</surname> <given-names>M. P.</given-names></name> <name><surname>Leymaster</surname> <given-names>K. A.</given-names></name> <name><surname>Kalbfleisch</surname> <given-names>T. S.</given-names></name> <name><surname>Kijas</surname> <given-names>J. W.</given-names></name> <name><surname>Clarke</surname> <given-names>S. M.</given-names></name> <name><surname>McEwan</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>SNPs for parentage testing and traceability in globally diverse breeds of sheep.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e94851</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0094851</pub-id> <pub-id pub-id-type="pmid">24740156</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>D. W.</given-names></name> <name><surname>Sherman</surname> <given-names>B. T.</given-names></name> <name><surname>Lempicki</surname> <given-names>R. A.</given-names></name></person-group> (<year>2009</year>). <article-title>Systematic and integrative analysis of large gene lists using DAVID bioinformatics resources.</article-title> <source><italic>Nat. Protoc.</italic></source> <volume>4</volume> <fpage>44</fpage>&#x2013;<lpage>57</lpage>. <pub-id pub-id-type="doi">10.1038/nprot.2008.211</pub-id> <pub-id pub-id-type="pmid">19131956</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>X.</given-names></name> <name><surname>Otecko</surname> <given-names>N. O.</given-names></name> <name><surname>Peng</surname> <given-names>M.</given-names></name> <name><surname>Weng</surname> <given-names>Z.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Chen</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Genome-wide genetic structure and selection signatures for color in 10 traditional Chinese yellow-feathered chicken breeds.</article-title> <source><italic>BMC Genomics</italic></source> <volume>21</volume>:<issue>316</issue>. <pub-id pub-id-type="doi">10.1186/s12864-020-6736-4</pub-id> <pub-id pub-id-type="pmid">32312230</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Issa</surname> <given-names>L.</given-names></name> <name><surname>Mueller</surname> <given-names>K.</given-names></name> <name><surname>Seufert</surname> <given-names>K.</given-names></name> <name><surname>Kraemer</surname> <given-names>N.</given-names></name> <name><surname>Rosenkotter</surname> <given-names>H.</given-names></name> <name><surname>Ninnemann</surname> <given-names>O.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Clinical and cellular features in patients with primary autosomal recessive microcephaly and a novel CDK5RAP2 mutation.</article-title> <source><italic>Orphanet J. Rare Dis.</italic></source> <volume>8</volume>:<issue>59</issue>. <pub-id pub-id-type="doi">10.1186/1750-1172-8-59</pub-id> <pub-id pub-id-type="pmid">23587236</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kang</surname> <given-names>N.</given-names></name> <name><surname>Chen</surname> <given-names>D.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Duan</surname> <given-names>L.</given-names></name> <name><surname>Liu</surname> <given-names>S.</given-names></name> <name><surname>Tang</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>Rwdd1, a thymus aging related molecule, is a new member of the intrinsically unstructured protein family.</article-title> <source><italic>Cell. Mol. Immunol.</italic></source> <volume>5</volume> <fpage>333</fpage>&#x2013;<lpage>339</lpage>. <pub-id pub-id-type="doi">10.1038/cmi.2008.41</pub-id> <pub-id pub-id-type="pmid">18954556</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>K&#x00E4;rst</surname> <given-names>S.</given-names></name> <name><surname>Cheng</surname> <given-names>R.</given-names></name> <name><surname>Schmitt</surname> <given-names>A. O.</given-names></name> <name><surname>Yang</surname> <given-names>H.</given-names></name> <name><surname>de Villena</surname> <given-names>F. P. M.</given-names></name> <name><surname>Palmer</surname> <given-names>A. A.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Genetic determinants for intramuscular fat content and water-holding capacity in mice selected for high muscle mass.</article-title> <source><italic>Mamm. Genome</italic></source> <volume>22</volume> <fpage>530</fpage>&#x2013;<lpage>543</lpage>. <pub-id pub-id-type="doi">10.1007/s00335-011-9342-6</pub-id> <pub-id pub-id-type="pmid">21732194</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kijas</surname> <given-names>J. W.</given-names></name> <name><surname>Lenstra</surname> <given-names>J. A.</given-names></name> <name><surname>Hayes</surname> <given-names>B.</given-names></name> <name><surname>Boitard</surname> <given-names>S.</given-names></name> <name><surname>Porto Neto</surname> <given-names>L. R.</given-names></name> <name><surname>San Cristobal</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Genome-wide analysis of the world&#x2019;s sheep breeds reveals high levels of historic mixture and strong recent selection.</article-title> <source><italic>PLoS Biol.</italic></source> <volume>10</volume>:<issue>e1001258</issue>. <pub-id pub-id-type="doi">10.1371/journal.pbio.1001258</pub-id> <pub-id pub-id-type="pmid">22346734</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>E.-S.</given-names></name> <name><surname>Elbeltagy</surname> <given-names>A. R.</given-names></name> <name><surname>Aboul-Naga</surname> <given-names>A. M.</given-names></name> <name><surname>Rischkowsky</surname> <given-names>B.</given-names></name> <name><surname>Sayre</surname> <given-names>B.</given-names></name> <name><surname>Mwacharo</surname> <given-names>J. M.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Multiple genomic signatures of selection in goats and sheep indigenous to a hot arid environment.</article-title> <source><italic>Heredity (Edinb)</italic></source> <volume>116</volume> <fpage>255</fpage>&#x2013;<lpage>264</lpage>. <pub-id pub-id-type="doi">10.1038/hdy.2015.94</pub-id> <pub-id pub-id-type="pmid">26555032</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Klambauer</surname> <given-names>G.</given-names></name> <name><surname>Schwarzbauer</surname> <given-names>K.</given-names></name> <name><surname>Mayr</surname> <given-names>A.</given-names></name> <name><surname>Clevert</surname> <given-names>D.-A.</given-names></name> <name><surname>Mitterecker</surname> <given-names>A.</given-names></name> <name><surname>Bodenhofer</surname> <given-names>U.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>cn.MOPS: mixture of Poissons for discovering copy number variations in next-generation sequencing data with a low false discovery rate.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>40</volume>:<issue>e69</issue>. <pub-id pub-id-type="doi">10.1093/nar/gks003</pub-id> <pub-id pub-id-type="pmid">22302147</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kobayashi</surname> <given-names>M.</given-names></name> <name><surname>Oshima</surname> <given-names>S.</given-names></name> <name><surname>Maeyashiki</surname> <given-names>C.</given-names></name> <name><surname>Nibe</surname> <given-names>Y.</given-names></name> <name><surname>Otsubo</surname> <given-names>K.</given-names></name> <name><surname>Matsuzawa</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>The ubiquitin hybrid gene UBA52 regulates ubiquitination of ribosome and sustains embryonic development.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>6</volume>:<issue>36780</issue>. <pub-id pub-id-type="doi">10.1038/srep36780</pub-id> <pub-id pub-id-type="pmid">27829658</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kobayashi</surname> <given-names>Y.</given-names></name> <name><surname>Ohshiro</surname> <given-names>N.</given-names></name> <name><surname>Sakai</surname> <given-names>R.</given-names></name> <name><surname>Ohbayashi</surname> <given-names>M.</given-names></name> <name><surname>Kohyama</surname> <given-names>N.</given-names></name> <name><surname>Yamamoto</surname> <given-names>T.</given-names></name></person-group> (<year>2005</year>). <article-title>Transport mechanism and substrate specificity of human organic anion transporter 2 (hOat2 [SLC22A7]).</article-title> <source><italic>J. Pharm. Pharmacol.</italic></source> <volume>57</volume> <fpage>573</fpage>&#x2013;<lpage>578</lpage>. <pub-id pub-id-type="doi">10.1211/0022357055966</pub-id> <pub-id pub-id-type="pmid">15901346</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>C.</given-names></name> <name><surname>Sun</surname> <given-names>D.</given-names></name> <name><surname>Zhang</surname> <given-names>S.</given-names></name> <name><surname>Yang</surname> <given-names>S.</given-names></name> <name><surname>Alim</surname> <given-names>M. A.</given-names></name> <name><surname>Zhang</surname> <given-names>Q.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Genetic effects of FASN, PPARGC1A, ABCG2 and IGF1 revealing the association with milk fatty acids in a Chinese Holstein cattle population based on a post genome-wide association study.</article-title> <source><italic>BMC Genet.</italic></source> <volume>17</volume>:<issue>110</issue>. <pub-id pub-id-type="doi">10.1186/s12863-016-0418-x</pub-id> <pub-id pub-id-type="pmid">27468856</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name></person-group> (<year>2013</year>). <article-title>Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM.</article-title> <source><italic>arXiv</italic></source> <comment>[preprint]</comment> <volume>arXiv</volume>:<issue>1303.3997</issue></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Handsaker</surname> <given-names>B.</given-names></name> <name><surname>Wysoker</surname> <given-names>A.</given-names></name> <name><surname>Fennell</surname> <given-names>T.</given-names></name> <name><surname>Ruan</surname> <given-names>J.</given-names></name> <name><surname>Homer</surname> <given-names>N.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>The Sequence Alignment/Map format and SAMtools.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>2078</fpage>&#x2013;<lpage>2079</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp352</pub-id> <pub-id pub-id-type="pmid">19505943</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Kim</surname> <given-names>S.-W.</given-names></name> <name><surname>Do</surname> <given-names>K.-T.</given-names></name> <name><surname>Ha</surname> <given-names>Y.-K.</given-names></name> <name><surname>Lee</surname> <given-names>Y.-M.</given-names></name> <name><surname>Yoon</surname> <given-names>S.-H.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Analyses of porcine public SNPs in coding-gene regions by re-sequencing and phenotypic association studies.</article-title> <source><italic>Mol. Biol. Rep.</italic></source> <volume>38</volume> <fpage>3805</fpage>&#x2013;<lpage>3820</lpage>. <pub-id pub-id-type="doi">10.1007/s11033-010-0496-1</pub-id> <pub-id pub-id-type="pmid">21107721</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Liu</surname> <given-names>X.</given-names></name> <name><surname>Qin</surname> <given-names>Z.</given-names></name> <name><surname>Wei</surname> <given-names>M.</given-names></name> <name><surname>Hou</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>A novel transcription factor Rwdd1 and its SUMOylation inhibit the expression of sqr, a key gene of mitochondrial sulfide metabolism in Urechis unicinctus.</article-title> <source><italic>Aquat. Toxicol.</italic></source> <volume>204</volume> <fpage>180</fpage>&#x2013;<lpage>189</lpage>. <pub-id pub-id-type="doi">10.1016/j.aquatox.2018.09.012</pub-id> <pub-id pub-id-type="pmid">30278355</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name> <name><surname>Shen</surname> <given-names>M.</given-names></name> <name><surname>Xie</surname> <given-names>X.-L.</given-names></name> <name><surname>Liu</surname> <given-names>G.-J.</given-names></name> <name><surname>Xu</surname> <given-names>Y.-X.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Whole-genome resequencing of wild and domestic sheep identifies genes associated with morphological and agronomic traits.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>11</volume>:<issue>2815</issue>. <pub-id pub-id-type="doi">10.1038/s41467-020-16485-1</pub-id> <pub-id pub-id-type="pmid">32499537</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lizarraga</surname> <given-names>S. B.</given-names></name> <name><surname>Margossian</surname> <given-names>S. P.</given-names></name> <name><surname>Harris</surname> <given-names>M. H.</given-names></name> <name><surname>Campagna</surname> <given-names>D. R.</given-names></name> <name><surname>Han</surname> <given-names>A.-P.</given-names></name> <name><surname>Blevins</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Cdk5rap2 regulates centrosome function and chromosome segregation in neuronal progenitors.</article-title> <source><italic>Development</italic></source> <volume>137</volume> <fpage>1907</fpage>&#x2013;<lpage>1917</lpage>. <pub-id pub-id-type="doi">10.1242/dev.040410</pub-id> <pub-id pub-id-type="pmid">20460369</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ma</surname> <given-names>Y.</given-names></name> <name><surname>Ding</surname> <given-names>X.</given-names></name> <name><surname>Qanbari</surname> <given-names>S.</given-names></name> <name><surname>Weigend</surname> <given-names>S.</given-names></name> <name><surname>Zhang</surname> <given-names>Q.</given-names></name> <name><surname>Simianer</surname> <given-names>H.</given-names></name></person-group> (<year>2015</year>). <article-title>Properties of different selection signature statistics and a new strategy for combining them.</article-title> <source><italic>Heredity (Edinb)</italic></source> <volume>115</volume> <fpage>426</fpage>&#x2013;<lpage>436</lpage>. <pub-id pub-id-type="doi">10.1038/hdy.2015.42</pub-id> <pub-id pub-id-type="pmid">25990878</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Marnetto</surname> <given-names>D.</given-names></name> <name><surname>Huerta-S&#x00E1;nchez</surname> <given-names>E.</given-names></name></person-group> (<year>2017</year>). <article-title>Haplostrips: revealing population structure through haplotype visualization.</article-title> <source><italic>Methods Ecol. Evol.</italic></source> <volume>8</volume> <fpage>1389</fpage>&#x2013;<lpage>1392</lpage>. <pub-id pub-id-type="doi">10.1111/2041-210X.12747</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McKenna</surname> <given-names>A.</given-names></name> <name><surname>Hanna</surname> <given-names>M.</given-names></name> <name><surname>Banks</surname> <given-names>E.</given-names></name> <name><surname>Sivachenko</surname> <given-names>A.</given-names></name> <name><surname>Cibulskis</surname> <given-names>K.</given-names></name> <name><surname>Kernytsky</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>The Genome Analysis Toolkit: a MapReduce framework for analyzing next-generation DNA sequencing data.</article-title> <source><italic>Genome Res.</italic></source> <volume>20</volume> <fpage>1297</fpage>&#x2013;<lpage>1303</lpage>. <pub-id pub-id-type="doi">10.1101/gr.107524.110</pub-id> <pub-id pub-id-type="pmid">20644199</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Miyashita</surname> <given-names>H.</given-names></name> <name><surname>Watanabe</surname> <given-names>T.</given-names></name> <name><surname>Hayashi</surname> <given-names>H.</given-names></name> <name><surname>Suzuki</surname> <given-names>Y.</given-names></name> <name><surname>Nakamura</surname> <given-names>T.</given-names></name> <name><surname>Ito</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Angiogenesis inhibitor vasohibin-1 enhances stress resistance of endothelial cells via induction of SOD<sub>2</sub> and SIRT<sub>1</sub>.</article-title> <source><italic>PLoS ONE</italic></source> <volume>7</volume>, <fpage>e46459</fpage>&#x2013;<lpage>e46459</lpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0046459</pub-id> <pub-id pub-id-type="pmid">23056314</pub-id></citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Naval-Sanchez</surname> <given-names>M.</given-names></name> <name><surname>Nguyen</surname> <given-names>Q.</given-names></name> <name><surname>McWilliam</surname> <given-names>S.</given-names></name> <name><surname>Porto-Neto</surname> <given-names>L. R.</given-names></name> <name><surname>Tellam</surname> <given-names>R.</given-names></name> <name><surname>Vuocolo</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Sheep genome functional annotation reveals proximal regulatory elements contributed to the evolution of modern breeds.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>9</volume>:<issue>859</issue>. <pub-id pub-id-type="doi">10.1038/s41467-017-02809-1</pub-id> <pub-id pub-id-type="pmid">29491421</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nei</surname> <given-names>M.</given-names></name> <name><surname>Li</surname> <given-names>W. H.</given-names></name></person-group> (<year>1979</year>). <article-title>Mathematical model for studying genetic variation in terms of restriction endonucleases.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>76</volume> <fpage>5269</fpage>&#x2013;<lpage>5273</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.76.10.5269</pub-id> <pub-id pub-id-type="pmid">291943</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Olivier</surname> <given-names>M.</given-names></name> <name><surname>Hsiung</surname> <given-names>C. A.</given-names></name> <name><surname>Chuang</surname> <given-names>L.-M.</given-names></name> <name><surname>Ho</surname> <given-names>L.-T.</given-names></name> <name><surname>Ting</surname> <given-names>C.-T.</given-names></name> <name><surname>Bustos</surname> <given-names>V. I.</given-names></name><etal/></person-group> (<year>2004</year>). <article-title>Single nucleotide polymorphisms in protein tyrosine phosphatase 1beta (PTPN1) are associated with essential hypertension and obesity.</article-title> <source><italic>Hum. Mol. Genet.</italic></source> <volume>13</volume> <fpage>1885</fpage>&#x2013;<lpage>1892</lpage>. <pub-id pub-id-type="doi">10.1093/hmg/ddh196</pub-id> <pub-id pub-id-type="pmid">15229188</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pasiakos</surname> <given-names>S.</given-names></name> <name><surname>Berryman</surname> <given-names>C.</given-names></name> <name><surname>Carrigan</surname> <given-names>C.</given-names></name> <name><surname>Young</surname> <given-names>A.</given-names></name> <name><surname>Carbone</surname> <given-names>J.</given-names></name></person-group> (<year>2017</year>). <article-title>Muscle protein turnover and the molecular regulation of muscle mass during hypoxia.</article-title> <source><italic>Med. Sci. Sport. Exerc.</italic></source> <volume>49</volume> <fpage>1340</fpage>&#x2013;<lpage>1350</lpage>. <pub-id pub-id-type="doi">10.1249/mss.0000000000001228</pub-id> <pub-id pub-id-type="pmid">28166119</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Periasamy</surname> <given-names>K.</given-names></name> <name><surname>Pichler</surname> <given-names>R.</given-names></name> <name><surname>Poli</surname> <given-names>M.</given-names></name> <name><surname>Cristel</surname> <given-names>S.</given-names></name> <name><surname>Cetr&#x00E1;</surname> <given-names>B.</given-names></name> <name><surname>Medus</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Candidate gene approach for parasite resistance in sheep&#x2013;variation in immune pathway genes and association with fecal egg count.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e88337</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0088337</pub-id> <pub-id pub-id-type="pmid">24533078</pub-id></citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Prades</surname> <given-names>C.</given-names></name> <name><surname>Arnould</surname> <given-names>I.</given-names></name> <name><surname>Annilo</surname> <given-names>T.</given-names></name> <name><surname>Shulenin</surname> <given-names>S.</given-names></name> <name><surname>Chen</surname> <given-names>Z. Q.</given-names></name> <name><surname>Orosco</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2002</year>). <article-title>The human ATP binding cassette gene ABCA13, located on chromosome 7p12.3, encodes a 5058 amino acid protein with an extracellular domain encoded in part by a 4.8-kb conserved exon.</article-title> <source><italic>Cytogenet. Genome Res.</italic></source> <volume>98</volume> <fpage>160</fpage>&#x2013;<lpage>168</lpage>. <pub-id pub-id-type="doi">10.1159/000069852</pub-id> <pub-id pub-id-type="pmid">12697998</pub-id></citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pszczola</surname> <given-names>M.</given-names></name> <name><surname>Strabel</surname> <given-names>T.</given-names></name> <name><surname>Mucha</surname> <given-names>S.</given-names></name> <name><surname>Sell-Kubiak</surname> <given-names>E.</given-names></name></person-group> (<year>2018</year>). <article-title>Genome-wide association identifies methane production level relation to genetic control of digestive tract development in dairy cows.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>8</volume>:<issue>15164</issue>. <pub-id pub-id-type="doi">10.1038/s41598-018-33327-9</pub-id> <pub-id pub-id-type="pmid">30310168</pub-id></citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Purcell</surname> <given-names>S.</given-names></name> <name><surname>Neale</surname> <given-names>B.</given-names></name> <name><surname>Todd-Brown</surname> <given-names>K.</given-names></name> <name><surname>Thomas</surname> <given-names>L.</given-names></name> <name><surname>Ferreira</surname> <given-names>M. A. R.</given-names></name> <name><surname>Bender</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>PLINK: a tool set for whole-genome association and population-based linkage analyses.</article-title> <source><italic>Am. J. Hum. Genet.</italic></source> <volume>81</volume> <fpage>559</fpage>&#x2013;<lpage>575</lpage>. <pub-id pub-id-type="doi">10.1086/519795</pub-id> <pub-id pub-id-type="pmid">17701901</pub-id></citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rahman</surname> <given-names>M. M.</given-names></name> <name><surname>Bagdassarian</surname> <given-names>E.</given-names></name> <name><surname>Ali</surname> <given-names>M. A. M.</given-names></name> <name><surname>McFadden</surname> <given-names>G.</given-names></name></person-group> (<year>2017</year>). <article-title>Identification of host DEAD-box RNA helicases that regulate cellular tropism of oncolytic Myxoma virus in human cancer cells.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>7</volume>:<issue>15710</issue>. <pub-id pub-id-type="doi">10.1038/s41598-017-15941-1</pub-id> <pub-id pub-id-type="pmid">29146961</pub-id></citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ryder</surname> <given-names>M.</given-names></name></person-group> (<year>1964</year>). <article-title>The history of sheep breeds in Britain.</article-title> <source><italic>Agric. Hist. Rev.</italic></source> <volume>12</volume> <fpage>1</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.2307/40273081</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Scheet</surname> <given-names>P.</given-names></name> <name><surname>Stephens</surname> <given-names>M.</given-names></name></person-group> (<year>2006</year>). <article-title>A fast and flexible statistical model for large-scale population genotype data: applications to inferring missing genotypes and haplotypic phase.</article-title> <source><italic>Am. J. Hum. Genet.</italic></source> <volume>78</volume> <fpage>629</fpage>&#x2013;<lpage>644</lpage>. <pub-id pub-id-type="doi">10.1086/502802</pub-id> <pub-id pub-id-type="pmid">16532393</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stronen</surname> <given-names>A. V.</given-names></name> <name><surname>Pertoldi</surname> <given-names>C.</given-names></name> <name><surname>Iacolina</surname> <given-names>L.</given-names></name> <name><surname>Kadarmideen</surname> <given-names>H. N.</given-names></name> <name><surname>Kristensen</surname> <given-names>T. N.</given-names></name></person-group> (<year>2019</year>). <article-title>Genomic analyses suggest adaptive differentiation of northern European native cattle breeds.</article-title> <source><italic>Evol. Appl.</italic></source> <volume>12</volume> <fpage>1096</fpage>&#x2013;<lpage>1113</lpage>. <pub-id pub-id-type="doi">10.1111/eva.12783</pub-id> <pub-id pub-id-type="pmid">31293626</pub-id></citation></ref>
<ref id="B64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sweet-Jones</surname> <given-names>J.</given-names></name> <name><surname>Yurchenko</surname> <given-names>A. A.</given-names></name> <name><surname>Igoshin</surname> <given-names>A. V.</given-names></name> <name><surname>Yudin</surname> <given-names>N. S.</given-names></name> <name><surname>Swain</surname> <given-names>M. T.</given-names></name> <name><surname>Larkin</surname> <given-names>D. M.</given-names></name></person-group> (<year>2021</year>). <article-title>Resequencing and signatures of selection scan in two Siberian native sheep breeds point to candidate genetic variants for adaptation and economically important traits.</article-title> <source><italic>Anim. Genet.</italic></source> <volume>52</volume> <fpage>126</fpage>&#x2013;<lpage>131</lpage>. <pub-id pub-id-type="doi">10.1111/age.13015</pub-id> <pub-id pub-id-type="pmid">33107621</pub-id></citation></ref>
<ref id="B65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tajima</surname> <given-names>F.</given-names></name></person-group> (<year>1989</year>). <article-title>Statistical method for testing the neutral mutation hypothesis by DNA polymorphism.</article-title> <source><italic>Genetics</italic></source> <volume>123</volume> <fpage>585</fpage>&#x2013;<lpage>595</lpage>. <pub-id pub-id-type="doi">10.1093/genetics/123.3.585</pub-id></citation></ref>
<ref id="B66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Takasuga</surname> <given-names>A.</given-names></name> <name><surname>Sato</surname> <given-names>K.</given-names></name> <name><surname>Nakamura</surname> <given-names>R.</given-names></name> <name><surname>Saito</surname> <given-names>Y.</given-names></name> <name><surname>Sasaki</surname> <given-names>S.</given-names></name> <name><surname>Tsuji</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Non-synonymous FGD3 variant as positional candidate for disproportional tall stature accounting for a carcass weight QTL (CW-3) and skeletal dysplasia in Japanese Black cattle.</article-title> <source><italic>PLoS Genet.</italic></source> <volume>11</volume>:<issue>e1005433</issue>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1005433</pub-id> <pub-id pub-id-type="pmid">26306008</pub-id></citation></ref>
<ref id="B67"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Takeda</surname> <given-names>E.</given-names></name> <name><surname>Suzuki</surname> <given-names>Y.</given-names></name> <name><surname>Sato</surname> <given-names>Y.</given-names></name></person-group> (<year>2016</year>). <article-title>Age-associated downregulation of vasohibin-1 in vascular endothelial cells.</article-title> <source><italic>Aging Cell</italic></source> <volume>15</volume> <fpage>885</fpage>&#x2013;<lpage>892</lpage>. <pub-id pub-id-type="doi">10.1111/acel.12497</pub-id> <pub-id pub-id-type="pmid">27325558</pub-id></citation></ref>
<ref id="B68"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tollenaere</surname> <given-names>M. A. X.</given-names></name> <name><surname>Tiedje</surname> <given-names>C.</given-names></name> <name><surname>Rasmussen</surname> <given-names>S.</given-names></name> <name><surname>Nielsen</surname> <given-names>J. C.</given-names></name> <name><surname>Vind</surname> <given-names>A. C.</given-names></name> <name><surname>Blasius</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>GIGYF1/2-driven cooperation between ZNF598 and TTP in posttranscriptional regulation of inflammatory signaling.</article-title> <source><italic>Cell Rep.</italic></source> <volume>26</volume>, <fpage>3511</fpage>&#x2013;<lpage>3521.e4</lpage>. <pub-id pub-id-type="doi">10.1016/j.celrep.2019.03.006</pub-id> <pub-id pub-id-type="pmid">30917308</pub-id></citation></ref>
<ref id="B69"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Turner</surname> <given-names>S. D.</given-names></name></person-group> (<year>2014</year>). <article-title>qqman: an R package for visualizing GWAS results using Q-Q and manhattan plots.</article-title> <source><italic>bioRxiv</italic></source> <comment>[preprint]</comment> <pub-id pub-id-type="doi">10.1101/005165</pub-id> <volume>bioRxiv</volume> <issue>005165</issue>.</citation></ref>
<ref id="B70"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>W.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Zhou</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>La</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Deep Genome resequencing reveals artificial and natural selection for visual deterioration, plateau adaptability and high prolificacy in Chinese domestic sheep.</article-title> <source><italic>Front. Genet.</italic></source> <volume>10</volume>:<issue>300</issue>. <pub-id pub-id-type="doi">10.3389/fgene.2019.00300</pub-id> <pub-id pub-id-type="pmid">31001329</pub-id></citation></ref>
<ref id="B71"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Weatherhead</surname> <given-names>B.</given-names></name> <name><surname>Logan</surname> <given-names>A. N. N.</given-names></name></person-group> (<year>1981</year>). <article-title>Interaction of &#x03B1;-melanocyte-stimulating hormone, melatonin, cyclin AMP and cyclic GMP in the control of melanogenesis in hair follicle melanocytes in vitro.</article-title> <source><italic>J. Endocrinol.</italic></source> <volume>90</volume> <fpage>89</fpage>&#x2013;<lpage>96</lpage>. <pub-id pub-id-type="doi">10.1677/joe.0.0900089</pub-id> <pub-id pub-id-type="pmid">6267154</pub-id></citation></ref>
<ref id="B72"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wei</surname> <given-names>C.</given-names></name> <name><surname>Wang</surname> <given-names>H.</given-names></name> <name><surname>Liu</surname> <given-names>G.</given-names></name> <name><surname>Wu</surname> <given-names>M.</given-names></name> <name><surname>Cao</surname> <given-names>J.</given-names></name> <name><surname>Liu</surname> <given-names>Z.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Genome-wide analysis reveals population structure and selection in Chinese indigenous sheep breeds.</article-title> <source><italic>BMC Genomics</italic></source> <volume>16</volume>:<issue>194</issue>. <pub-id pub-id-type="doi">10.1186/s12864-015-1384-9</pub-id> <pub-id pub-id-type="pmid">25888314</pub-id></citation></ref>
<ref id="B73"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Weir</surname> <given-names>B. S.</given-names></name> <name><surname>Cockerham</surname> <given-names>C. C.</given-names></name></person-group> (<year>1984</year>). <article-title>Estimating F-statistics for the analysis of population structure.</article-title> <source><italic>Evolution (N. Y)</italic></source> <volume>38</volume> <fpage>1358</fpage>&#x2013;<lpage>1370</lpage>. <pub-id pub-id-type="doi">10.2307/2408641</pub-id></citation></ref>
<ref id="B74"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Williams-Davies</surname> <given-names>J.</given-names></name></person-group> (<year>1981</year>). <source><italic>Welsh Sheep and Their Wool</italic></source>, <edition>1st Edn</edition>. <publisher-loc>Dyfed</publisher-loc>: <publisher-name>Gormer Press</publisher-name>.</citation></ref>
<ref id="B75"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yan</surname> <given-names>K.</given-names></name> <name><surname>Gao</surname> <given-names>L.-N.</given-names></name> <name><surname>Cui</surname> <given-names>Y.-L.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Zhou</surname> <given-names>X.</given-names></name></person-group> (<year>2016</year>). <article-title>The cyclic AMP signalling pathway: Exploring targets for successful drug discovery (Review).</article-title> <source><italic>Mol. Med. Rep.</italic></source> <volume>13</volume> <fpage>3715</fpage>&#x2013;<lpage>3723</lpage>. <pub-id pub-id-type="doi">10.3892/mmr.2016.5005</pub-id> <pub-id pub-id-type="pmid">27035868</pub-id></citation></ref>
<ref id="B76"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>G.-L.</given-names></name> <name><surname>Fu</surname> <given-names>D.-L.</given-names></name> <name><surname>Lang</surname> <given-names>X.</given-names></name> <name><surname>Wang</surname> <given-names>Y.-T.</given-names></name> <name><surname>Cheng</surname> <given-names>S.-R.</given-names></name> <name><surname>Fang</surname> <given-names>S.-L.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Mutations in MC1R gene determine black coat color phenotype in Chinese sheep.</article-title> <source><italic>Sci. World J.</italic></source> <volume>2013</volume>:<issue>675382</issue>. <pub-id pub-id-type="doi">10.1155/2013/675382</pub-id> <pub-id pub-id-type="pmid">24082855</pub-id></citation></ref>
<ref id="B77"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>W.-R.</given-names></name> <name><surname>Lv</surname> <given-names>F.-H.</given-names></name> <name><surname>He</surname> <given-names>S.-G.</given-names></name> <name><surname>Tian</surname> <given-names>S.-L.</given-names></name> <name><surname>Peng</surname> <given-names>W.-F.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Whole-Genome sequencing of native sheep provides insights into rapid adaptations to extreme environments.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>33</volume> <fpage>2576</fpage>&#x2013;<lpage>2592</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msw129</pub-id> <pub-id pub-id-type="pmid">27401233</pub-id></citation></ref>
<ref id="B78"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>Z.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Li</surname> <given-names>F.</given-names></name> <name><surname>Yue</surname> <given-names>X.</given-names></name></person-group> (<year>2019</year>). <article-title>Selection signature analysis reveals genes underlying sheep milking performance.</article-title> <source><italic>Arch. Anim. Breed.</italic></source> <volume>62</volume> <fpage>501</fpage>&#x2013;<lpage>508</lpage>. <pub-id pub-id-type="doi">10.5194/aab-62-501-2019</pub-id> <pub-id pub-id-type="pmid">31807661</pub-id></citation></ref>
<ref id="B79"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yurchenko</surname> <given-names>A. A.</given-names></name> <name><surname>Deniskova</surname> <given-names>T. E.</given-names></name> <name><surname>Yudin</surname> <given-names>N. S.</given-names></name> <name><surname>Dotsev</surname> <given-names>A. V.</given-names></name> <name><surname>Khamiruev</surname> <given-names>T. N.</given-names></name> <name><surname>Selionova</surname> <given-names>M. I.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>High-density genotyping reveals signatures of selection related to acclimation and economically important traits in 15 local sheep breeds from Russia.</article-title> <source><italic>BMC Genomics</italic></source> <volume>20</volume>:<issue>294</issue>. <pub-id pub-id-type="doi">10.1186/s12864-019-5537-0</pub-id> <pub-id pub-id-type="pmid">32039702</pub-id></citation></ref>
<ref id="B80"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zeder</surname> <given-names>M. A.</given-names></name></person-group> (<year>2008</year>). <article-title>Domestication and early agriculture in the Mediterranean Basin: origins, diffusion, and impact.</article-title> <source><italic>Proc. Natl. Acad. Sci.</italic></source> <volume>105</volume> <fpage>11597</fpage>&#x2013;<lpage>11604</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0801317105</pub-id> <pub-id pub-id-type="pmid">18697943</pub-id></citation></ref>
</ref-list><fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="http://broadinstitute.github.io/picard/">http://broadinstitute.github.io/picard/</ext-link></p></fn>
</fn-group>
</back>
</article>
