<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1384973</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2024.1384973</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Optimizing purebred selection to improve crossbred performance</article-title>
<alt-title alt-title-type="left-running-head">Barani et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fgene.2024.1384973">10.3389/fgene.2024.1384973</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Barani</surname>
<given-names>Somayeh</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2654637/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Miraie Ashtiani</surname>
<given-names>Sayed Reza</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2653916/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Nejati Javaremi</surname>
<given-names>Ardeshir</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/457923/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Khansefid</surname>
<given-names>Majid</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1067958/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Esfandyari</surname>
<given-names>Hadi</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/891530/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Animal Science</institution>, <institution>Faculty of Agriculture, College of Agriculture and Natural Resources</institution>, <institution>University of Tehran</institution>, <addr-line>Karaj</addr-line>, <country>Iran</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Agriculture Victoria Research, AgriBio</institution>, <institution>Centre for AgriBioscience</institution>, <addr-line>Bundoora</addr-line>, <addr-line>VIC</addr-line>, <country>Australia</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>School of Applied Systems Biology</institution>, <institution>La Trobe University</institution>, <addr-line>Bundoora</addr-line>, <addr-line>VIC</addr-line>, <country>Australia</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Qualitas</institution>, <addr-line>Zug</addr-line>, <country>Switzerland</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/212867/overview">Lingyang Xu</ext-link>, Institute of Animal Sciences, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1346213/overview">Sabyasachi Mukherjee</ext-link>, Indian Council of Agricultural Research (ICAR), India</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/401936/overview">Mohammad Hossein Banabazi</ext-link>, Swedish University of Agricultural Sciences, Sweden</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Sayed Reza Miraie Ashtiani, <email>ashtiani@ut.ac.ir</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>24</day>
<month>09</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1384973</elocation-id>
<history>
<date date-type="received">
<day>11</day>
<month>02</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>29</day>
<month>08</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Barani, Miraie Ashtiani, Nejati Javaremi, Khansefid and Esfandyari.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Barani, Miraie Ashtiani, Nejati Javaremi, Khansefid and Esfandyari</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Crossbreeding is a widely adopted practice in the livestock industry, leveraging the advantages of heterosis and breed complementarity. The prediction of Crossbred Performance (CP) often relies on Purebred Performance (PB) due to limited crossbred data availability. However, the effective selection of purebred parents for enhancing CP depends on non-additive genetic effects and environmental factors. These factors are encapsulated in the genetic correlation between crossbred and purebred populations (<inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>). In this study, a two-way crossbreeding simulation was employed to investigate various strategies for integrating data from purebred and crossbred populations. The goal was to identify optimal models that maximize CP across different levels of <inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. Different scenarios involving the selection of genotyped individuals from purebred and crossbred populations were explored using ssGBLUP (single-step Genomic Best Linear Unbiased Prediction) and ssGBLUP-MF (ssGBLUP with metafounders) models. The findings revealed an increase in prediction accuracy across all scenarios as <inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> values increased. Notably, in the scenario incorporating genotypes from both purebred parent breeds and their crossbreds, both ssGBLUP and ssGBLUP-MF models exhibited nearly identical predictive accuracy. This scenario achieved maximum accuracy when <inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> was less than 0.5. However, at <inline-formula id="inf5">
<mml:math id="m5">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> &#x3d; 0.8, ssGBLUP, which exclusively included sire breed genotypes in the training set, achieved the highest overall prediction accuracy at 73.2%. In comparison, the BLUP-UPG (BLUP with unknown parent group) model demonstrated lower accuracy than ssGBLUP and ssGBLUP-MF across all <inline-formula id="inf6">
<mml:math id="m6">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> levels. Although ssGBLUP and ssGBLUP-MF did not demonstrate a definitive trend in their respective scenarios, the prediction ability for CP increased when incorporating both crossbred and purebred population genotypes at lower levels of <inline-formula id="inf7">
<mml:math id="m7">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. Furthermore, when <inline-formula id="inf8">
<mml:math id="m8">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> was high, utilizing paternal genotype for CP predictions emerged as the most effective strategy. Predicted dispersion remained relatively similar in all scenarios, indicating a slight underestimation of breeding values. Overall, the <inline-formula id="inf9">
<mml:math id="m9">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> value emerged as a critical factor in predicting CP based on purebred data. However, the optimal model to maximize CP depends on the factors influencing <inline-formula id="inf10">
<mml:math id="m10">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. Consequently, ongoing research aims to develop models that optimize purebred selection, further enhancing CP.</p>
</abstract>
<kwd-group>
<kwd>crossbred performance</kwd>
<kwd>genetic correlation between crossbred and purebred populations</kwd>
<kwd>unknown parent group</kwd>
<kwd>metafounders. ssGBLUP</kwd>
<kwd>SSGblup</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Livestock Genomics</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Crossbreeding in livestock and poultry breeding is used to maximize crossbred performance (CP) through benefiting from heterosis and breed complementarity. Genetic evaluation in the crossbreeding system is usually based on phenotypes and genotypes of purebred parents, which in fact leads to the selection of the best purebred parents in the pure populations. However, the best pure parents will not necessarily produce the optimal crossbred progenies, which means the performance of purebred parents is not the best predictor for CP (<xref ref-type="bibr" rid="B10">Esfandyari et al., 2015</xref>). Ideally, crossbred data should be used rather than purebred data which can lead to a more significant improvement in CP; nevertheless, gathering data from commercial populations can be challenging and expensive (<xref ref-type="bibr" rid="B31">Wei and van der Werf, 1994</xref>). Therefore, animal breeders inevitably utilize the performance of purebred parents to predict the CP.</p>
<p>The genetic correlation (<inline-formula id="inf11">
<mml:math id="m11">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>) between purebred and crossbred populations is a pivotal factor influencing the accuracy of predicting CP based on purebred data (<xref ref-type="bibr" rid="B16">Legarra et al., 2009</xref>). The value of <inline-formula id="inf12">
<mml:math id="m12">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is shaped by various factors, including, (i) Genotype by genotype interaction (G &#xd7; G); Arising from differing allelic frequencies of causal variants in purebred and crossbred populations (<xref ref-type="bibr" rid="B7">Christensen and Lund, 2010</xref>). (ii) Genotype by environment interaction (G &#xd7; E); Resulting from environmental disparities between the two populations. (iii) Incompatibility of measured traits; Present in purebred and crossbred populations (<xref ref-type="bibr" rid="B5">Christensen, 2012</xref>). These factors, coupled with non-additive genetic effects, particularly dominance effects, can lead to deviations in <inline-formula id="inf13">
<mml:math id="m13">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> from 1. When <inline-formula id="inf14">
<mml:math id="m14">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> deviates from 1, utilizing purebred performance (PB) to assess crossbreds may hinder the rate of improvement in CP. Research suggests that if this deviation is attributable to dominance effects, implementing a dominance model can enhance the prediction accuracy of CP when the reference comprises purebred populations (<xref ref-type="bibr" rid="B17">Legarra et al., 2015</xref>). However, in practice, deviations in <inline-formula id="inf15">
<mml:math id="m15">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> from 1 stem from multiple factors mentioned earlier.</p>
<p>Another challenge in predicting CP is the low genetic relatedness between parental breeds, despite their shared common ancestors several generations ago. Addressing these complexities is crucial for refining predictive models and advancing the accuracy of CP evaluations based on purebred data.</p>
<p>In recent years, single-step genomic BLUP (ssGBLUP) has significantly increased the accuracy of breeding value estimation by blending marker and pedigree information of both genotyped and ungenotyped animals (<xref ref-type="bibr" rid="B16">Legarra et al., 2009</xref>; <xref ref-type="bibr" rid="B7">Christensen and Lund, 2010</xref>). However, the main remaining challenge is how to combine pedigree-based and genomic relationships, given the base population does not have pedigree or genotype information. In the same vein, Christensen constructed the marker-based relationship matrix by assuming that all allele frequencies equal to 0.5 and base animals are related and inbred (<xref ref-type="bibr" rid="B5">Christensen, 2012</xref>). Subsequently, <xref ref-type="bibr" rid="B17">Legarra et al. (2015)</xref> proposed a comprehensive theoretical framework for incorporating relatedness within and across founders into a base relationship matrix, using the concept of metafounders (MFs). The base animals assumed to be related, so in ssGBLUP with metafounders (ssGBLUP-MF), matrix G is constructed with all allele frequencies equal to 0.5. Consequently, the founders of the breeds are related to a common ancestor, represented by the matrix &#x393; which describes the relationship of the founders (<xref ref-type="bibr" rid="B17">Legarra et al., 2015</xref>).</p>
<p>Motivated by the challenges inherent in predicting CP, this paper strives to pinpoint the optimal strategy for integrating data and selecting the most suitable model to maximize CP at various levels of <inline-formula id="inf16">
<mml:math id="m16">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. This objective remains irrespective of the factors causing deviations in <inline-formula id="inf17">
<mml:math id="m17">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> from 1.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>2 Materials and methods</title>
<sec id="s2-1">
<title>2.1 Simulation</title>
<p>The simulation was conducted in two parts. The first part was focused on generating datasets of purebred and crossbred animals for a single trait with a heritability of 0.3 using the QMSim software (<xref ref-type="bibr" rid="B27">Sargolzaei and Schenkel, 2009</xref>). In the initial phase of the simulation, a historical population of 5,000 founders was simulated for 1,000 generations with a constant population size of 5,000. This step aimed to establish genetic drift and linkage disequilibrium (LD) between markers and causal variants. Subsequently, the population size was gradually reduced from 5,000 to 2000 individuals over an additional 1,500 generations. After that, the population size was considered steady during the last 500 generations. To create two breeds (breeds A and B), two random samples of 50 males and 500 females were taken from the last generation of the historical population (the first bottleneck), then the population size was expanded over the next 200 generations. Simulating various population sizes and dynamics across generations aids in comprehending the impact of genetic drift, selection, and other evolutionary forces. The initial step involved simulating linkage disequilibrium between markers and causal variants. The subsequent step consisted of simulating a gradual reduction in population size resulting from domestication and other minor bottleneck events (<xref ref-type="bibr" rid="B4">Brito et al., 2011</xref>). The final step entailed creating two separate breeds. In this step, to simulate the sheep breeding system, we implemented random mating with 5 descendants per dam considering 1/2 of the twining average and 4 parturitions per generation. In the next step, the second bottleneck was simulated by selecting two random samples (100 males and 1,000 females) from the last generation of the breeds A and B to generate the recent populations of the breeds (called expanding A and B). In this step, breeding values were estimated based on best liner unbiased prediction (BLUP) method. The next generations were simulated by imposing a replacement rate of 20% for dams and 50% for sires. The culling and selection designs were contingent on age and high estimated breeding value, respectively. The breeding scheme in this step was continued for 10 generations. Then crossbred animals (F1) were produced from crossing between males from expanding A and females from expanding B populations. We simulated three crossbred populations (F1) that were generated from generations 8, 9, and 10 (<xref ref-type="fig" rid="F1">Figure 1</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Schematic representation of the simulated population. A (paternal line) and B (maternal line) are purebred populations. <inline-formula id="inf18">
<mml:math id="m18">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mi>B</mml:mi>
</mml:mrow>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf19">
<mml:math id="m19">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mi>B</mml:mi>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf20">
<mml:math id="m20">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mi>B</mml:mi>
</mml:mrow>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are crossbred populations that are derived from generations (GEN) 8, 9 and 10 of expanded (EXP) purebred populations A and B.</p>
</caption>
<graphic xlink:href="fgene-15-1384973-g001.tif"/>
</fig>
<p>Genome structure was simulated with 26 autosomal chromosomes and a total length of 3,421 centimorgan (cM) similar to the sheep genome size estimated by <xref ref-type="bibr" rid="B24">Prieur et al. (2017)</xref>. We simulated 50K single nucleotide polymorphisms (SNP) and 500 quantitative trait loci (QTLs) randomly scattered across the whole genome. Minor allele frequencies (MAF) of markers were assumed to be upper than 0.05 and mutation rates of the SNPs and QTL was <inline-formula id="inf21">
<mml:math id="m21">
<mml:mrow>
<mml:mn>2.5</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>. The QTL allele effects were inferred from a Gamma distribution with <inline-formula id="inf22">
<mml:math id="m22">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0.4</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (summarized in <xref ref-type="table" rid="T1">Table 1</xref>). True breeding values (TBVs) were obtained from the sum of the additive effect of QTL. The phenotypes were calculated based on the additive genetic and residual effects. Subsequently, we measured the fixation index (<inline-formula id="inf23">
<mml:math id="m23">
<mml:mrow>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>) and performed the principal component analysis (PCA) to assess the population structure and distinctness of the three populations. The <inline-formula id="inf24">
<mml:math id="m24">
<mml:mrow>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is a measure of population differentiation due to genetic structure (<xref ref-type="bibr" rid="B21">Nagylaki, 1998</xref>). PCA is a multivariate analysis that reduces the dimensionality of the data while preserving their covariance which we applied to find the eigenvalues and eigenvectors of the covariance matrix of allele frequencies (<xref ref-type="bibr" rid="B25">Reich et al., 2008</xref>).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>The parameters used for simulating trait and genome.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Item</th>
<th align="left">Value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Heritability (h<sup>2</sup>)</td>
<td align="left">0.3</td>
</tr>
<tr>
<td align="left">Genome size</td>
<td align="left">3,421&#xa0;cM</td>
</tr>
<tr>
<td align="left">Number of chromosomes</td>
<td align="left">26</td>
</tr>
<tr>
<td align="left">Number of markers</td>
<td align="left">50,000</td>
</tr>
<tr>
<td align="left">Number of QTL</td>
<td align="left">500</td>
</tr>
<tr>
<td align="left">Mutation rate in QTL and markers</td>
<td align="left">2.5 &#xd7; 10<sup>&#x2212;5</sup>
</td>
</tr>
<tr>
<td align="left">Minor allele frequency in QTL and markers</td>
<td align="left">0.05</td>
</tr>
<tr>
<td align="left">Distribution of additive QTL effects</td>
<td align="left">Gamma (&#x3b1; &#x3d; 0.4, 1.66)</td>
</tr>
<tr>
<td align="left">Additive genetic correlation between purebred and crossbred populations (<inline-formula id="inf25">
<mml:math id="m25">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>)</td>
<td align="left">0.2, 0.5 or 0.8</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In the second part of the simulation, to investigate the impact of <inline-formula id="inf26">
<mml:math id="m26">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> on the identification of optimal and cost-efficient strategies for improving CP, three levels of <inline-formula id="inf27">
<mml:math id="m27">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> (low, medium, and high, corresponding to 0.2, 0.5, and 0.8, respectively) were simulated using the BGLR and MASS packages in R (<xref ref-type="bibr" rid="B26">Ripley et al., 2013</xref>; <xref ref-type="bibr" rid="B23">P&#xe9;rez and de Los Campos, 2014</xref>). To simulate the <inline-formula id="inf28">
<mml:math id="m28">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> levels, the additive effects of purebreds and crossbreds were simulated using a multivariate normal distribution with mean 0 and a positive-definite symmetric matrix specifying the covariance matrix of the variables, according to the desired levels of <inline-formula id="inf29">
<mml:math id="m29">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and the effects of QTLs. Therefore the <inline-formula id="inf30">
<mml:math id="m30">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="bold-italic">r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is defined as follows (<xref ref-type="bibr" rid="B11">Falconer, 1996</xref>):<disp-formula id="equ1">
<mml:math id="m31">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">c</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">P</mml:mi>
<mml:mi mathvariant="bold-italic">B</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">C</mml:mi>
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:mrow>
</mml:msub>
</mml:msub>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">P</mml:mi>
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:mrow>
</mml:msub>
</mml:msub>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">C</mml:mi>
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:mrow>
</mml:msub>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf31">
<mml:math id="m32">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">P</mml:mi>
<mml:mi mathvariant="bold-italic">B</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">C</mml:mi>
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:mrow>
</mml:msub>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the additive genetic covariance between PB and CB performance, and <inline-formula id="inf32">
<mml:math id="m33">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">P</mml:mi>
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:mrow>
</mml:msub>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf33">
<mml:math id="m34">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">C</mml:mi>
<mml:mi mathvariant="bold-italic">B</mml:mi>
</mml:mrow>
</mml:msub>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are the additive genetic standard deviation in purebred and crossbred populations, respectively.</p>
<p>We conducted the population simulation 10 times and subsequently performed a comparative analysis of the predictive abilities of three methods: BLUP-UPG (BLUP with unknown parent group), ssGBLUP, and ssGBLUP-MF methods. The breeding values were estimated based on the same pedigree and data file, considering four scenarios of genotype selection from purebred and crossbred populations: SC1: breeds A, B and crossbreds, SC2: breeds A and B, SC3: breed A and SC4: breed B population.</p>
</sec>
<sec id="s2-2">
<title>2.2 Data analysis</title>
<p>Three prediction models were used to calculate breeding values: BLUP-UPG, ssGBLUP, and ssGBLUP-MF. The generation 0 produced after the second bottleneck was assumed to be the base population (i.e., only the pedigree information after generation 0 was used to predict breeding values). For the ssGBLUP and ssGBLUP-MF models, we explored various scenarios for including genotypes from both purebred and crossbred populations. The statistical model was as follows:<disp-formula id="equ2">
<mml:math id="m35">
<mml:mrow>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="bold-italic">X</mml:mi>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi mathvariant="bold-italic">Z</mml:mi>
<mml:mi mathvariant="bold-italic">u</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi mathvariant="bold-italic">e</mml:mi>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf34">
<mml:math id="m36">
<mml:mrow>
<mml:mi mathvariant="bold-italic">y</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the vector of phenotypes, <inline-formula id="inf35">
<mml:math id="m37">
<mml:mrow>
<mml:mi mathvariant="bold-italic">b</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the vector of fixed effects (breed, sex, and generation) and <inline-formula id="inf36">
<mml:math id="m38">
<mml:mrow>
<mml:mi mathvariant="bold-italic">u</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the vector of additive genetic effects distributed as <inline-formula id="inf37">
<mml:math id="m39">
<mml:mrow>
<mml:mi mathvariant="bold-italic">u</mml:mi>
<mml:mo>&#x223c;</mml:mo>
<mml:mi mathvariant="bold-italic">N</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn mathvariant="bold">0</mml:mn>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:mi mathvariant="bold-italic">u</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <inline-formula id="inf38">
<mml:math id="m40">
<mml:mrow>
<mml:mi mathvariant="bold-italic">X</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf39">
<mml:math id="m41">
<mml:mrow>
<mml:mi mathvariant="bold-italic">Z</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> are incidence matrices relating the animals to the fixed effects and the additive effects, respectively, <inline-formula id="inf40">
<mml:math id="m42">
<mml:mrow>
<mml:mi mathvariant="bold-italic">e</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is a vector of residuals that were sampled from a normal distribution, with <inline-formula id="inf41">
<mml:math id="m43">
<mml:mrow>
<mml:mi mathvariant="bold-italic">e</mml:mi>
<mml:mo>&#x223c;</mml:mo>
<mml:mi mathvariant="bold-italic">N</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn mathvariant="bold">0</mml:mn>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
<mml:mi mathvariant="bold-italic">e</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> We used the BLUPF90 family (<xref ref-type="bibr" rid="B19">Misztal et al., 2014</xref>) of programs, which includes airemlf90 and blupf90test, to estimate variance components using restricted maximum likelihood (REML). Moreover, we used predictf90 to adjust the phenotypes.</p>
<sec id="s2-2-1">
<title>2.2.1 Best Linear Unbiased Prediction (BLUP)</title>
<p>In this study, we utilized various advanced statistical models for genetic prediction. Each model has its own hypotheses, advantages, and limitations. One of the models we employed is BLUP-UPG, which incorporates unknown-parent groups (UPGs) to handle missing pedigree data. Accurate group assignments and variance estimation are crucial for this model to ensure robust predictions (<xref ref-type="bibr" rid="B13">Henderson, 1975</xref>). In our study, we encountered unknown parents only in the first generation, while we knew the parents in all subsequent generations. The use of UPGs in this model helps estimate the genetic merit of animals in the pedigree when their parents are unknown (<xref ref-type="bibr" rid="B12">Graser et al., 1987</xref>). Without defining UPGs for each breed, the genetic merit of animals with unknown parents is assumed to be equal to that of the base generation, potentially leading to biased predictions.</p>
</sec>
<sec id="s2-2-2">
<title>2.2.2 Single-Step Genomic Best Linear Unbiased Prediction (ssGBLUP)</title>
<p>Single-step GBLUP model combines phenotypes, pedigree, and genotypes into a single evaluation and replaces the pedigree relationships between genotyped individuals with realized relationships by incorporating pedigree and genomic relationships in <inline-formula id="inf42">
<mml:math id="m44">
<mml:mrow>
<mml:mi mathvariant="bold-italic">H</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> matrix, but requires significant computational resources and high-quality data. The additive (<italic>
<bold>u</bold>
</italic>) and residual (<italic>
<bold>e</bold>
</italic>) effects are assumed to be independently distributed with <inline-formula id="inf43">
<mml:math id="m45">
<mml:mrow>
<mml:mi mathvariant="bold-italic">u</mml:mi>
<mml:mo>&#x223c;</mml:mo>
<mml:mi mathvariant="bold-italic">N</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn mathvariant="bold">0</mml:mn>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mi mathvariant="bold-italic">H</mml:mi>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
</mml:mrow>
<mml:mi mathvariant="bold-italic">u</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf44">
<mml:math id="m46">
<mml:mrow>
<mml:mi mathvariant="bold-italic">e</mml:mi>
<mml:mo>&#x223c;</mml:mo>
<mml:mi mathvariant="bold-italic">N</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn mathvariant="bold">0</mml:mn>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mi mathvariant="bold-italic">I</mml:mi>
<mml:mi mathvariant="bold-italic">&#x3c3;</mml:mi>
</mml:mrow>
<mml:mi mathvariant="bold-italic">e</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, respectively. The H matrix is described as:<disp-formula id="equ3">
<mml:math id="m47">
<mml:mrow>
<mml:mi mathvariant="bold-italic">H</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold">H</mml:mi>
<mml:mn mathvariant="bold">11</mml:mn>
</mml:msub>
</mml:mtd>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold">H</mml:mi>
<mml:mn mathvariant="bold">12</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold">H</mml:mi>
<mml:mn mathvariant="bold">21</mml:mn>
</mml:msub>
</mml:mtd>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold">H</mml:mi>
<mml:mn mathvariant="bold">22</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">A</mml:mi>
<mml:mn mathvariant="bold">11</mml:mn>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold">A</mml:mi>
<mml:mn mathvariant="bold">22</mml:mn>
</mml:msub>
<mml:msubsup>
<mml:mi mathvariant="bold">A</mml:mi>
<mml:mn mathvariant="bold">22</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold">G</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="bold">G</mml:mi>
</mml:mrow>
<mml:mn mathvariant="bold">22</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:msubsup>
<mml:mi mathvariant="bold">A</mml:mi>
<mml:mn mathvariant="bold">22</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mi mathvariant="bold">A</mml:mi>
<mml:mn mathvariant="bold">21</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mtd>
<mml:mtd>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">G</mml:mi>
<mml:mn mathvariant="bold">12</mml:mn>
</mml:msub>
<mml:msubsup>
<mml:mi mathvariant="bold">A</mml:mi>
<mml:mn mathvariant="bold">22</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mi mathvariant="bold">G</mml:mi>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mi mathvariant="bold">G</mml:mi>
<mml:msubsup>
<mml:mi mathvariant="bold">A</mml:mi>
<mml:mn mathvariant="bold">22</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mi mathvariant="bold">G</mml:mi>
<mml:mn mathvariant="bold">11</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mtd>
<mml:mtd>
<mml:mi mathvariant="bold">G</mml:mi>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="equ4">
<mml:math id="m48">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold-italic">H</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2b;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:mn mathvariant="bold">0</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mn mathvariant="bold">0</mml:mn>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mn mathvariant="bold">0</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold-italic">G</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="bold">A</mml:mi>
<mml:mn mathvariant="bold">22</mml:mn>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>where the subscript <inline-formula id="inf45">
<mml:math id="m49">
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf46">
<mml:math id="m50">
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> indicate ungenotyped and genotyped individuals, respectively. The <inline-formula id="inf47">
<mml:math id="m51">
<mml:mrow>
<mml:mi mathvariant="bold-italic">H</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> matrix can be constructed from the relationships of genotyped and ungenotyped animals (<xref ref-type="bibr" rid="B1">Aguilar et al., 2010</xref>). However, <italic>
<bold>H</bold>
</italic>
<sup>
<italic>&#x2212;<bold>1</bold>
</italic>
</sup> can be directly calculated using <inline-formula id="inf48">
<mml:math id="m52">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf49">
<mml:math id="m53">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold-italic">G</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> which contain pedigree and genomic relationships related to ungenotyped and genotyped individuals, respectively, and <inline-formula id="inf50">
<mml:math id="m54">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold">A</mml:mi>
<mml:mn mathvariant="bold">22</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the pedigree relationship matrix just for genotyped animals.</p>
</sec>
<sec id="s2-2-3">
<title>2.2.3 Single-Step Genomic BLUP with Metafounders (ssGBLUP-MF-)</title>
<p>A metafounder is a pseudo-individual considered both sire and dam of all base animals. This approach extends VanRaden`s method (<xref ref-type="bibr" rid="B30">VanRaden, 1992</xref>) for estimating relationships across breeds (<xref ref-type="bibr" rid="B17">Legarra et al., 2015</xref>). To further enhance prediction accuracy in diverse populations, we incorporated metafounders in the ssGBLUP-MF model. However, this increased the complexity of the model and posed challenges in parameter estimation (<xref ref-type="bibr" rid="B17">Legarra et al., 2015</xref>). The significance of the metafounder is particularly important when considering both racial groups together. The use of different scenarios also arises from the limitation of measuring certain traits in crossbred groups, so it is inevitably based on the parental group. In our simulation, the founders in the base population of purebred parents were defined based on the number of pure breeds, so we had two metafounders.</p>
<p>In ssGBLUP, <inline-formula id="inf51">
<mml:math id="m55">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold">H</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> with metafounders <inline-formula id="inf52">
<mml:math id="m56">
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">H</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold">&#x393;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</inline-formula> can be represented as (<xref ref-type="bibr" rid="B6">Christensen et al., 2015</xref>):<disp-formula id="equ5">
<mml:math id="m57">
<mml:mrow>
<mml:msubsup>
<mml:mi mathvariant="bold-italic">H</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold">&#x393;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:msubsup>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold">&#x393;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2b;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:mn mathvariant="bold">0</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mn mathvariant="bold">0</mml:mn>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mn mathvariant="bold">0</mml:mn>
</mml:mtd>
<mml:mtd>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi mathvariant="bold-italic">&#x3c4;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mn mathvariant="bold">0.95</mml:mn>
<mml:mi mathvariant="bold-italic">G</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn mathvariant="bold">0.05</mml:mn>
<mml:mi mathvariant="bold-italic">A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold">&#x393;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn mathvariant="bold">22</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mi mathvariant="bold">&#x3c9;</mml:mi>
<mml:mi mathvariant="bold">A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold">&#x393;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn mathvariant="bold">22</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="equ6">
<mml:math id="m58">
<mml:mrow>
<mml:mi mathvariant="bold-italic">G</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:msup>
<mml:mrow>
<mml:mi mathvariant="bold-italic">Z</mml:mi>
<mml:mi mathvariant="bold-italic">Z</mml:mi>
</mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
<mml:mrow>
<mml:mn mathvariant="bold">2</mml:mn>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
<mml:mi mathvariant="bold-italic">m</mml:mi>
</mml:msubsup>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf53">
<mml:math id="m59">
<mml:mrow>
<mml:msubsup>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">&#x393;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf54">
<mml:math id="m60">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold-italic">G</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> capture the inverse of the pedigree and genomic relationships, respectively. <bold>G</bold> is the genomic relationship matrix which can be calculated using matrix of allele counts <bold>(Z)</bold> and allele frequency (p) of <italic>m</italic> markers. <inline-formula id="inf55">
<mml:math id="m61">
<mml:mrow>
<mml:msubsup>
<mml:mi mathvariant="bold-italic">A</mml:mi>
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">&#x393;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn mathvariant="bold">22</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> represent the pedigree relationships among genotyped animals which is subtracted from genomic relationships to avoid double-counting of pedigree relationships for genotyped animals. The <inline-formula id="inf56">
<mml:math id="m62">
<mml:mrow>
<mml:mi mathvariant="bold-italic">&#x3c4;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> &#x3d; 1 and <inline-formula id="inf57">
<mml:math id="m63">
<mml:mrow>
<mml:mi mathvariant="bold-italic">&#x3c9;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> &#x3d; 1 are scaling factors used to combine <bold>G</bold> and <bold>A</bold> matrices, respectively (<xref ref-type="bibr" rid="B2">Alvarenga et al., 2020</xref>).</p>
</sec>
</sec>
<sec id="s2-3">
<title>2.3 Prediction ability (accuracy and dispersion) of purebred parents</title>
<p>The predictive ability of sires in breed A for maximizing CP was evaluated in this study using two metrics, accuracy, and dispersion. Accuracy was assessed according to <xref ref-type="bibr" rid="B9">Esfandyari et al. (2016)</xref>, by calculating the correlation between the (genomic) estimated breeding value or (G) EBV of sires in breed A and the adjusted CP mean of their crossbred progeny for the number of progenies. The correlation is likely to be higher for sires which have more progeny, as their (G) EBVs are calculated based on performance of large number of progenies. The average accuracy of mean CP was calculated as <inline-formula id="inf58">
<mml:math id="m64">
<mml:mrow>
<mml:msqrt>
<mml:mfrac>
<mml:mi mathvariant="bold-italic">n</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">n</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi mathvariant="bold-italic">k</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:msqrt>
</mml:mrow>
</mml:math>
</inline-formula> , where n is the number of progenies per sire and <inline-formula id="inf59">
<mml:math id="m65">
<mml:mrow>
<mml:mi mathvariant="bold-italic">k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn mathvariant="bold">4</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mi mathvariant="bold-italic">h</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold-italic">h</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msup>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula> is a correction factor which depends on the heritability of the trait. The predicted dispersion of (G)EBV was measured by the deviation of the slop (<inline-formula id="inf60">
<mml:math id="m66">
<mml:mrow>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>) from the regression TBVs on (G)EBVs in the crossbred population (<xref ref-type="bibr" rid="B15">Kluska et al., 2021</xref>).</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Genetic connectedness between populations</title>
<p>The PCA scattered plot is shown in <xref ref-type="fig" rid="F2">Figure 2</xref>. The first two principal components (PCs) explain 8.249% and 7.92% of the total variance, respectively. The genetic relatedness between populations before simulation of <inline-formula id="inf61">
<mml:math id="m67">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> levels as measured by <inline-formula id="inf62">
<mml:math id="m68">
<mml:mrow>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> was 0.032 between purebred parental breeds, while <inline-formula id="inf63">
<mml:math id="m69">
<mml:mrow>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> between purebred and crossbred populations was 0.023.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Individuals clustered to three distinct groups based PC1 and PC2. In this figure, the blue, red, and green colors represent the individuals of breed A, breed B, and their crosses, respectively.</p>
</caption>
<graphic xlink:href="fgene-15-1384973-g002.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>3.2 Prediction ability</title>
<p>The prediction accuracy of the three models across scenarios is detailed in <xref ref-type="table" rid="T2">Table 2</xref>. In general, a positive correlation between prediction accuracy and <inline-formula id="inf64">
<mml:math id="m70">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> value was observed. However, the BLUP-UPG model exhibited lower accuracy than the other models at all levels of <inline-formula id="inf65">
<mml:math id="m71">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. In contrast, ssGBLUP and ssGBLUP-MF displayed inconsistent trends across their respective scenarios.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Mean and standard deviation (in parentheses) of accuracy across 10 replicates in each scenario with different genetic correlation between crossbred and purebred populations (r<sub>pc</sub>).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="center">
<inline-formula id="inf66">
<mml:math id="m72">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th colspan="7" align="center">Model/Scenario</th>
</tr>
<tr>
<th align="center">BLUP-UPG</th>
<th align="center">ssGBLUP-MFSC1</th>
<th align="center">ssGBLUP-MFSC2</th>
<th align="center">ssGBLUP-SC1</th>
<th align="center">ssGBLUP-SC2</th>
<th align="center">ssGBLUP-SC3</th>
<th align="center">ssGBLUP-SC4</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">0.2</td>
<td align="center">0.114 (0.028)</td>
<td align="center">0.204 (0.019)</td>
<td align="center">0.171 (0.028)</td>
<td align="center">0.226 (0.026)</td>
<td align="center">0.195 (0.029)</td>
<td align="center">0.213 (0.022)</td>
<td align="center">0.131 (0.024)</td>
</tr>
<tr>
<td align="center">0.5</td>
<td align="center">0.343 (0.023)</td>
<td align="center">0.439 (0.021)</td>
<td align="center">0.424 (0.022)</td>
<td align="center">0.447 (0.022)</td>
<td align="center">0.339 (0.023)</td>
<td align="center">0.405 (0.030)</td>
<td align="center">0.358 (0.018)</td>
</tr>
<tr>
<td align="center">0.8</td>
<td align="center">0.505 (0.015)</td>
<td align="center">0.603 (0.014)</td>
<td align="center">0.568 (0.022)</td>
<td align="center">0.618 (0.019)</td>
<td align="center">0.631 (0.019)</td>
<td align="center">0.732 (0.016)</td>
<td align="center">0.545 (0.015)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>&#x2a; indicates the model we used, including model BLUP-UPG, Best Linear Unbiased Prediction with Unknown-Parent Groups; ssGBLUP, Single-Step Genomic BLUP, and ssGBLUP-MF, ssGBLUP, with Metafounders.</p>
</fn>
<fn>
<p>&#x2a;&#x2a; represents the scenarios of genotype selection from purebred and crossbred populations.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Considering the first scenario encompassing genotypes (using breeds A, B, and crossbreds), ssGBLUP outperformed ssGBLUP-MF at all levels of <inline-formula id="inf67">
<mml:math id="m73">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. On the other hand, among the scenarios for selecting genotypes in ssGBLUP, SC3 (using sire genotypes) achieved the highest prediction accuracy. However, the optimal scenario depended on the <inline-formula id="inf68">
<mml:math id="m74">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> level. For example, at <inline-formula id="inf69">
<mml:math id="m75">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> values of 0.2 and 0.8, ssGBLUP-SC1 and ssGBLUP-SC3 outperformed other scenarios. Interestingly, the scenario incorporating the genotype of purebred dams (SC4) in ssGBLUP had the lowest accuracy among the scenarios, nearly the same as BLUP-UPG. Additionally, at <inline-formula id="inf70">
<mml:math id="m76">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> &#x3d; 0.8, ssGBLUP continued to outperform both ssGBLUP-MF and BLUP-UPG. Specifically, ssGBLUP-SC3 achieved an impressive prediction accuracy of 73.2%.</p>
<p>In <xref ref-type="fig" rid="F3">Figure 3</xref>, the regression coefficient (<inline-formula id="inf71">
<mml:math id="m77">
<mml:mrow>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>) of TBVs on (G)EBVs in different models is shown which can indicate the dispersion of predicted breeding values. A low regression coefficient (<inline-formula id="inf72">
<mml:math id="m78">
<mml:mrow>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> &#x3c;1.0) indicates overprediction (inflation), and <inline-formula id="inf73">
<mml:math id="m79">
<mml:mrow>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> &#x3e;1.0 shows underprediction (deflation) of GEBVs (<xref ref-type="bibr" rid="B28">Tsuruta et al., 2019</xref>). The results of our study showed a slight underprediction of)G)EBVs across all scenarios and at different levels of <inline-formula id="inf74">
<mml:math id="m80">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, the regression coefficients ranging from 1.067 to 1.220. A comparison of the regression coefficients between ssGBLUP and ssGBLUP-MF revealed that ssGBLUP-MF predictions had lower dispersion. Furthermore, ssGBLUP-SC2 and ssGBLUP-MFSC1 had minimum dispersion values at the <inline-formula id="inf75">
<mml:math id="m81">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> level of 0.2 compared to the other scenarios. At the <inline-formula id="inf76">
<mml:math id="m82">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> level of 0.5, ssGBLUP-SC2 exhibited a minor deflation in dispersion, while in contrast, ssBLUP-MFSC1 consistently displayed the lowest dispersion among all the scenarios. At the <inline-formula id="inf77">
<mml:math id="m83">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> level of 0.8, the dispersion was almost similar across all scenarios, except ssGBLUP-SC1, which exhibited a slight deflation of the <inline-formula id="inf78">
<mml:math id="m84">
<mml:mrow>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> compared to the other scenarios.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>The regression coefficient (<inline-formula id="inf79">
<mml:math id="m85">
<mml:mrow>
<mml:msub>
<mml:mi>b</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>) of TBVs on (G) EBVs for crossbred population across different scenarios and genetic correlation between crossbred and purebred populations (rpc).</p>
</caption>
<graphic xlink:href="fgene-15-1384973-g003.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussions</title>
<p>The genetic merit of a purebred individual can be explained as: (i) its breeding value within the purebred population, and (ii) its breeding value as a purebred parent of a crossbred progeny (<xref ref-type="bibr" rid="B8">Esfandyari et al., 2018</xref>). The breeding value of a purebred parent of a crossbred offspring depends on a range of non-additive genetic effects, which can be summarized in <inline-formula id="inf80">
<mml:math id="m86">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. However, it is difficult to consider all factors in <inline-formula id="inf81">
<mml:math id="m87">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> simulation. Consequently, in this study, we focused on the overall effect of <inline-formula id="inf82">
<mml:math id="m88">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> on evaluating CP based on parental and/or crossbred data.</p>
<p>Based on the PCA graph, we observed three distinct populations. The crossbred population was positioned between the two purebred populations. This positioning was a result of simulating interbreeding within each purebred population for 210 generations, leading to complete differentiation of the two parental lines. The results of the <inline-formula id="inf83">
<mml:math id="m89">
<mml:mrow>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> analysis also support the findings from the PCA graph. The crossbred individuals genetically possess a combination of traits from both purebred populations, as indicated by the PCA graph. This is because interbreeding was simulated within each purebred population for 210 generations. Extended breeding within each group has resulted in significant genetic differentiation, making the two purebred populations genetically distinct from each other. The <inline-formula id="inf84">
<mml:math id="m90">
<mml:mrow>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> analysis results, which measure genetic differentiation between populations, align with the PCA graph. High <inline-formula id="inf85">
<mml:math id="m91">
<mml:mrow>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> values indicate significant differentiation, supporting the observation that the purebred populations are distinct while the crossbred population is intermediate.</p>
<p>The increase in <inline-formula id="inf86">
<mml:math id="m92">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> level improved the prediction accuracy in all simulated scenarios. However, the prediction accuracy was not significantly different in different scenarios, which could be due to the method we used to simulate <inline-formula id="inf87">
<mml:math id="m93">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. The BLUP-UPG model showed the lowest prediction accuracy at all <inline-formula id="inf88">
<mml:math id="m94">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> levels which was expected, because it completely depended on pedigree relationships. While, genomic evaluation models which uses high-density SNP genotyping can capture relationships between individuals (with or without pedigree connection) more accurately. This may lead to optimal selection of purebred animals in parental lines for improved crossbred performance (<xref ref-type="bibr" rid="B33">Zhao et al., 2015</xref>). Our results showed that ssGBLUP-SC1 and ssGBLUP-MFSC1 provide the highest prediction accuracy in all scenarios when the <inline-formula id="inf89">
<mml:math id="m95">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> was less than 0.5. Hence, including crossbred and purebred data in the evaluation model could improve CP prediction. However, this improvement was observed only for low <inline-formula id="inf90">
<mml:math id="m96">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> value. Which could be useful when there is no emphasis on purebred performance in breeding goal (<xref ref-type="bibr" rid="B29">Van Grevenhof and Van der Werf, 2015</xref>), the reference population is large, and the genetic relatedness between crossbred population and purebred selection candidates is high (<xref ref-type="bibr" rid="B32">Wientjes et al., 2020</xref>). When the genetic relatedness between purebred and crossbred populations is high, including crossbred data only adds to model complexity and runtime as well as costs of genotyping. The accuracy of CP also depends on the heritability of the trait in purebreds and crossbreds (<xref ref-type="bibr" rid="B32">Wientjes et al., 2020</xref>). When the heritability of the trait is lower in crossbreds than purebreds, the accuracy of selection by traditional and genomic evaluations will be adversely impacted.</p>
<p>The ssGBLUP-SC3 model performed the best at the <inline-formula id="inf91">
<mml:math id="m97">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> &#x3d; 0.8, which may be due to the high number of crossbred progenies per sire in breed A. It is important to note that, if purebred QTLs are not included in the combined reference population, accuracy will be significantly reduced. In other words, the SNP effect is primarily determined by breeds that are more common in the reference population when considering the gene flow (<xref ref-type="bibr" rid="B14">Karaman et al., 2021</xref>). The linkage disequilibrium between markers and QTLs should also remain high in purebred and crossbred populations. Therefore, using high marker density can be effective in developing prediction equations and preventing loss of accuracy.</p>
<p>Based on the results, ssGBLUP in the first scenario was generally more accurate than ssGBLUP-MF. Although the accuracy of ssGBLUP-MF was expected to be slightly higher than that of ssGBLUP, in our simulated population there were no missing parents, and the base populations of the two purebreds were far apart. In real data, due to considerable number of missing parents in the pedigree, we should not assume the animals with unknown parents are associated with the same base population. Otherwise, the additive variance could not be estimated properly (<xref ref-type="bibr" rid="B20">Mrode, 2014</xref>). Therefore, considering pseudo-parents as UPG and metafounders should generally improve the prediction accuracy.</p>
<p>Our results showed a slight deflation of the predicted dispersion of (G)EBV in all scenarios. The predicted dispersion in BLUP-UPG was not significantly different to the other models. This could be due to lack of simulating missing parents and use of UPG in our BLUP-UPG model. Nevertheless, ignoring missing pedigree in BLUP model has been reported to increase the dispersion compared to the genomic models (<xref ref-type="bibr" rid="B3">Bradford et al., 2019</xref>). Although, ssGBLUP-MF displayed the lowest dispersion among all the scenarios, incorporation of MF in genomic relationship has only a small impact on the predicted dispersion compared to alternative models. It should be noted that the impact of MF depends on the number of animals with genotypes and phenotypes which are associated with each MF (<xref ref-type="bibr" rid="B15">Kluska et al., 2021</xref>). A comparison between MF and UPG revealed that MF predictions had similar or lower levels of inflation and bias (<xref ref-type="bibr" rid="B18">Masuda et al., 2019</xref>). Furthermore, ssGBLUP-MF has been reported to be more stable (<xref ref-type="bibr" rid="B15">Kluska et al., 2021</xref>). The main difference between UPGs and MFs is that in MFs the relationships within and across populations are take into account to measure the covariance of gametes transmitted from base animals to their descendants (<xref ref-type="bibr" rid="B17">Legarra et al., 2015</xref>). However, dispersion in ssGBLUP is noticeable when the pedigree is deep and incomplete, or when inbreeding is ignored in calculation of pedigree relationships (<xref ref-type="bibr" rid="B15">Kluska et al., 2021</xref>). Generally, the inflation in breeding values is common when the selected candidates have different amounts of information (<xref ref-type="bibr" rid="B22">Neves et al., 2012</xref>). In ssGBLUP, inconsistencies arise from conflicting genomic and pedigree relationship matrices, leading to variations in predictive performance. The inclusion of metafounders (MF) in ssGBLUP-MF aims to address this issue by establishing a unified base population, thereby improving the alignment of genomic and pedigree information. However, due to the simulation process, the performance of the two methods varied across different scenarios, and neither method demonstrated superior performance in all scenarios.</p>
</sec>
<sec sec-type="conclusions" id="s5">
<title>5 Conclusions</title>
<p>This study demonstrated that at low <inline-formula id="inf92">
<mml:math id="m98">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> levels, employing crossbred and purebred populations in ssGBLUP and ssGBLUP-MF models resulted in enhanced predictive ability for CP. At high <inline-formula id="inf93">
<mml:math id="m99">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> levels, utilizing paternal data in the ssGBLUP model yielded optimal CP predictions. The expected slightly higher accuracy of ssGBLUP-MF compared to ssGBLUP was due to the considerable genetic divergence between the base populations of the two simulated purebred populations. Nevertheless, the key factor in maximizing CP based on purebred selection was the <inline-formula id="inf94">
<mml:math id="m100">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> value. Although the results can be influenced by <inline-formula id="inf95">
<mml:math id="m101">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and other factors, ultimately, the selection of the most suitable model for enhancing CP depends on <inline-formula id="inf96">
<mml:math id="m102">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. Further research to develop models based on purebred selection to improve CP is warranted.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s7">
<title>Ethics statement</title>
<p>Ethical approval was not required for the study involving animals in accordance with the local legislation and institutional requirements because we used data produced through a simulation process.</p>
</sec>
<sec id="s8">
<title>Author contributions</title>
<p>SB: Formal Analysis, Investigation, Writing&#x2013;original draft, Data curation, Methodology. SM: Conceptualization, Writing&#x2013;review and editing, Supervision. AN: Conceptualization, Project administration, Writing&#x2013;review and editing. MK: Formal Analysis, Methodology, Validation, Writing&#x2013;original draft. HE: Conceptualization, Formal Analysis, Methodology, Validation, Writing&#x2013;review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s9">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research, authorship, and/or publication of this article.</p>
</sec>
<ack>
<p>We express our sincere gratitude to Rostam Pahlavan for his invaluable contribution to all aspects of data analysis and writing of this article. Regrettably we were unable to formally mention his name in the publication, but our appreciation for his efforts is wholehearted.</p>
</ack>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of interest</title>
<p>Hadi Esfandyari was employed by Qualitas.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aguilar</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Misztal</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>Legarra</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Tsuruta</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lawlor</surname>
<given-names>T. J.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Hot topic: a unified approach to utilize phenotypic, full pedigree, and genomic information for genetic evaluation of Holstein final score</article-title>. <source>J. dairy Sci.</source> <volume>93</volume> (<issue>2</issue>), <fpage>743</fpage>&#x2013;<lpage>752</lpage>. <pub-id pub-id-type="doi">10.3168/jds.2009-2730</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alvarenga</surname>
<given-names>A. B.</given-names>
</name>
<name>
<surname>Veroneze</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Oliveira</surname>
<given-names>H. R.</given-names>
</name>
<name>
<surname>Marques</surname>
<given-names>D. B.</given-names>
</name>
<name>
<surname>Lopes</surname>
<given-names>P. S.</given-names>
</name>
<name>
<surname>Silva</surname>
<given-names>F. F.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Comparing alternative single-step GBLUP approaches and training population designs for genomic evaluation of crossbred animals</article-title>. <source>Front. Genet.</source> <volume>263</volume>. <pub-id pub-id-type="doi">10.3389/fgene.2020.00263</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bradford</surname>
<given-names>H. L.</given-names>
</name>
<name>
<surname>Masuda</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>VanRaden</surname>
<given-names>P. M.</given-names>
</name>
<name>
<surname>Legarra</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Misztal</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Modeling missing pedigree in single-step genomic BLUP</article-title>. <source>J. Dairy Sci.</source> <volume>102</volume> (<issue>3</issue>), <fpage>2336</fpage>&#x2013;<lpage>2346</lpage>. <pub-id pub-id-type="doi">10.3168/jds.2018-15434</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brito</surname>
<given-names>F. V.</given-names>
</name>
<name>
<surname>Neto</surname>
<given-names>J. B.</given-names>
</name>
<name>
<surname>Sargolzaei</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cobuci</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Schenkel</surname>
<given-names>F. S.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Accuracy of genomic selection in simulated populations mimicking the extent of linkage disequilibrium in beef cattle</article-title>. <source>BMC Genet.</source> <volume>12</volume>, <fpage>80</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1186/1471-2156-12-80</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Christensen</surname>
<given-names>O. F.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Compatibility of pedigree-based and marker-based relationship matrices for single-step genetic evaluation</article-title>. <source>Genet. Sel. Evol.</source> <volume>44</volume>, <fpage>37</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1186/1297-9686-44-37</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Christensen</surname>
<given-names>O. F.</given-names>
</name>
<name>
<surname>Legarra</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lund</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Genetic evaluation for three-way crossbreeding</article-title>. <source>Genet. Sel. Evol.</source> <volume>47</volume> (<issue>1</issue>), <fpage>98</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1186/s12711-015-0177-6</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Christensen</surname>
<given-names>O. F.</given-names>
</name>
<name>
<surname>Lund</surname>
<given-names>M. S.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Genomic prediction when some animals are not genotyped</article-title>. <source>Genet. Sel. Evol.</source> <volume>42</volume>, <fpage>2</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1186/1297-9686-42-2</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Esfandyari</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Berg</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>S&#xf8;rensen</surname>
<given-names>A. C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Balanced selection on purebred and crossbred performance increases gain in crossbreds</article-title>. <source>Genet. Sel. Evol.</source> <volume>50</volume>, <fpage>8</fpage>&#x2013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1186/s12711-018-0379-9</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Esfandyari</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Bijma</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Henryon</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Christensen</surname>
<given-names>O. F.</given-names>
</name>
<name>
<surname>S&#xf8;rensen</surname>
<given-names>A. C.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Genomic prediction of crossbred performance based on purebred Landrace and Yorkshire data using a dominance model</article-title>. <source>Genet. Sel. Evol.</source> <volume>48</volume> (<issue>1</issue>), <fpage>40</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1186/s12711-016-0220-2</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Esfandyari</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>S&#xf8;rensen</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Bijma</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>A crossbred reference population can improve the response to genomic selection for crossbred performance</article-title>. <source>Genet. Sel. Evol.</source> <volume>47</volume> (<issue>1</issue>), <fpage>76</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1186/s12711-015-0155-z</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Falconer</surname>
<given-names>D. S.</given-names>
</name>
</person-group> (<year>1996</year>). <source>Introduction to quantitative genetics</source>. <publisher-loc>Harlow, Essex, United Kingdom</publisher-loc>: <publisher-name>Longman Group Limited</publisher-name>.</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Graser</surname>
<given-names>H. U.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>S. P.</given-names>
</name>
<name>
<surname>Tier</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>A derivative-free approach for estimating variance components in animal models by restricted maximum likelihood</article-title>. <source>J. animal Sci.</source> <volume>64</volume> (<issue>5</issue>), <fpage>1362</fpage>&#x2013;<lpage>1370</lpage>. <pub-id pub-id-type="doi">10.2527/jas1987.6451362x</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Henderson</surname>
<given-names>C. R.</given-names>
</name>
</person-group> (<year>1975</year>). <article-title>Best linear unbiased estimation and prediction under a selection model</article-title>. <source>Biometrics</source> <volume>31</volume>, <fpage>423</fpage>&#x2013;<lpage>447</lpage>. <pub-id pub-id-type="doi">10.2307/2529430</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Karaman</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Croue</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Lund</surname>
<given-names>M. S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Genomic prediction using a reference population of multiple pure breeds and admixed individuals</article-title>. <source>Genet. Sel. Evol.</source> <volume>53</volume> (<issue>1</issue>), <fpage>46</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1186/s12711-021-00637-y</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kluska</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Masuda</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ferraz</surname>
<given-names>J. B. S.</given-names>
</name>
<name>
<surname>Tsuruta</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Eler</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Baldi</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Metafounders may reduce bias in composite cattle genomic predictions</article-title>. <source>Front. Genet.</source> <volume>12</volume>, <fpage>678587</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2021.678587</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Legarra</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Aguilar</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Misztal</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>A relationship matrix including full pedigree and genomic information</article-title>. <source>J. dairy Sci.</source> <volume>92</volume> (<issue>9</issue>), <fpage>4656</fpage>&#x2013;<lpage>4663</lpage>. <pub-id pub-id-type="doi">10.3168/jds.2009-2061</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Legarra</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Christensen</surname>
<given-names>O. F.</given-names>
</name>
<name>
<surname>Vitezica</surname>
<given-names>Z. G.</given-names>
</name>
<name>
<surname>Aguilar</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Misztal</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Ancestral relationships using metafounders: finite ancestral populations and across population relationships</article-title>. <source>Genetics</source> <volume>200</volume> (<issue>2</issue>), <fpage>455</fpage>&#x2013;<lpage>468</lpage>. <pub-id pub-id-type="doi">10.1534/genetics.115.177014</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Masuda</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tsuruta</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Nicolazzi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Misztal</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Single step GBLUP including more than 2 million genotypes with missing pedigrees for production traits in US Holstein</article-title>. <source>Interbull Meet.</source> <volume>22</volume>.</citation>
</ref>
<ref id="B19">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Misztal</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Tsuruta</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lourenco</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Aguilar</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Legarra</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Vitezica</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2014</year>). <source>Manual for BLUPF90 family of programs</source>. <publisher-loc>Athens</publisher-loc>: <publisher-name>University of Georgia</publisher-name>, <fpage>199</fpage>.</citation>
</ref>
<ref id="B20">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Mrode</surname>
<given-names>R. A.</given-names>
</name>
</person-group> (<year>2014</year>). <source>Linear models for the prediction of animal breeding values</source>. <publisher-loc>Wallingford, United Kingdom</publisher-loc>: <publisher-name>CABI</publisher-name>.</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nagylaki</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Fixation indices in subdivided populations</article-title>. <source>Genetics</source> <volume>148</volume> (<issue>3</issue>), <fpage>1325</fpage>&#x2013;<lpage>1332</lpage>. <pub-id pub-id-type="doi">10.1093/genetics/148.3.1325</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Neves</surname>
<given-names>H. H.</given-names>
</name>
<name>
<surname>Carvalheiro</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Queiroz</surname>
<given-names>S. A.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>A comparison of statistical methods for genomic selection in a mice population</article-title>. <source>BMC Genet.</source> <volume>13</volume> (<issue>1</issue>), <fpage>100</fpage>&#x2013;<lpage>117</lpage>. <pub-id pub-id-type="doi">10.1186/1471-2156-13-100</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>P&#xe9;rez</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>de Los Campos</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Genome-wide regression and prediction with the BGLR statistical package</article-title>. <source>Genetics</source> <volume>198</volume> (<issue>2</issue>), <fpage>483</fpage>&#x2013;<lpage>495</lpage>. <pub-id pub-id-type="doi">10.1534/genetics.114.164442</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Prieur</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Clarke</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Brito</surname>
<given-names>L. F.</given-names>
</name>
<name>
<surname>McEwan</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Brauning</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Estimation of linkage disequilibrium and effective population size in New Zealand sheep using three different methods to create genetic maps</article-title>. <source>BMC Genet.</source> <volume>18</volume> (<issue>1</issue>), <fpage>68</fpage>&#x2013;<lpage>19</lpage>. <pub-id pub-id-type="doi">10.1186/s12863-017-0534-2</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reich</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Price</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Patterson</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Principal component analysis of genetic data</article-title>. <source>Nat. Genet.</source> <volume>40</volume> (<issue>5</issue>), <fpage>491</fpage>&#x2013;<lpage>492</lpage>. <pub-id pub-id-type="doi">10.1038/ng0508-491</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ripley</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Venables</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Bates</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hornik</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Gebhardt</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Firth</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <source>Package &#x201c;Mass&#x201d;</source>. <publisher-name>Cran r</publisher-name> <volume>538</volume>, <fpage>113</fpage>&#x2013;<lpage>120</lpage>.</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sargolzaei</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Schenkel</surname>
<given-names>F. S.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>QMSim: a large-scale genome simulator for livestock</article-title>. <source>Bioinformatics</source> <volume>25</volume> (<issue>5</issue>), <fpage>680</fpage>&#x2013;<lpage>681</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp045</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tsuruta</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lourenco</surname>
<given-names>D. A. L.</given-names>
</name>
<name>
<surname>Masuda</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Misztal</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Lawlor</surname>
<given-names>T. J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Controlling bias in genomic breeding values for young genotyped bulls</article-title>. <source>J. dairy Sci.</source> <volume>102</volume> (<issue>11</issue>), <fpage>9956</fpage>&#x2013;<lpage>9970</lpage>. <pub-id pub-id-type="doi">10.3168/jds.2019-16789</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van Grevenhof</surname>
<given-names>I. E.</given-names>
</name>
<name>
<surname>Van der Werf</surname>
<given-names>J. H.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Design of reference populations for genomic selection in crossbreeding programs</article-title>. <source>Genet. Sel. Evol.</source> <volume>47</volume> (<issue>1</issue>), <fpage>14</fpage>&#x2013;<lpage>19</lpage>. <pub-id pub-id-type="doi">10.1186/s12711-015-0104-x</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>VanRaden</surname>
<given-names>P. M.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>Accounting for inbreeding and crossbreeding in genetic evaluation of large populations</article-title>. <source>J. Dairy Sci.</source> <volume>75</volume> (<issue>11</issue>), <fpage>3136</fpage>&#x2013;<lpage>3144</lpage>. <pub-id pub-id-type="doi">10.3168/jds.s0022-0302(92)78077-1</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>van der Werf</surname>
<given-names>J. H.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Maximizing genetic response in crossbreds using both purebred and crossbred information</article-title>. <source>Animal Sci.</source> <volume>59</volume> (<issue>3</issue>), <fpage>401</fpage>&#x2013;<lpage>413</lpage>. <pub-id pub-id-type="doi">10.1017/s0003356100007923</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wientjes</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Bijma</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Calus</surname>
<given-names>M. P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Optimizing genomic reference populations to improve crossbred performance</article-title>. <source>Genet. Sel. Evol.</source> <volume>52</volume> (<issue>1</issue>), <fpage>65</fpage>&#x2013;<lpage>18</lpage>. <pub-id pub-id-type="doi">10.1186/s12711-020-00573-3</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mette</surname>
<given-names>M. F.</given-names>
</name>
<name>
<surname>Reif</surname>
<given-names>J. C.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Genomic selection in hybrid breeding</article-title>. <source>Plant Breed.</source> <volume>134</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1111/pbr.12231</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>