<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Cell. Infect. Microbiol.</journal-id>
<journal-title>Frontiers in Cellular and Infection Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Cell. Infect. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">2235-2988</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fcimb.2024.1349046</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Cellular and Infection Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Comprehensive characterization of ERV-K (HML-8) in the chimpanzee genome revealed less genomic activity than humans</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Chunlei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhai</surname>
<given-names>Xiuli</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Shibo</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2601603"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Bohan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Caiqin</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Song</surname>
<given-names>Yanmei</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Hanping</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1893716"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Yongjian</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Han</surname>
<given-names>Jingwan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Xiaolin</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Jingyun</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Chen</surname>
<given-names>Mingyue</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/941352"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Jia</surname>
<given-names>Lei</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1984146"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Lin</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/833045"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Microbiology, School of Basic Medicine, Anhui Medical University</institution>, <addr-line>Hefei, Anhui</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Virology, Beijing Institute of Microbiology and Epidemiology</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>State Key Laboratory of Pathogen and Biosecurity</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>National 111 Center for Cellular Regulation and Molecular Pharmaceutics, Key Laboratory of Fermentation Engineering, Hubei University of Technology</institution>, <addr-line>Wuhan, Hubei</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Lei Huang, People's Liberation Army General Hospital, China</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Emanuela Balestrieri, University of Rome Tor Vergata, Italy</p>
<p>Tara Theresa Doucet-O'Hare, National Institutes of Health (NIH), Bethesda, United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Mingyue Chen, <email xlink:href="mailto:chenmy2007525@163.com">chenmy2007525@163.com</email>; Lei Jia, <email xlink:href="mailto:15001193408@163.com">15001193408@163.com</email>; Lin Li, <email xlink:href="mailto:dearwood@sina.com">dearwood@sina.com</email>
</p>
</fn>
<fn fn-type="other" id="fn003">
<p>&#x2020;These authors share first authorship</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>22</day>
<month>02</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>14</volume>
<elocation-id>1349046</elocation-id>
<history>
<date date-type="received">
<day>04</day>
<month>12</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>02</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Wang, Zhai, Wang, Zhang, Yang, Song, Li, Liu, Han, Wang, Li, Chen, Jia and Li</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Wang, Zhai, Wang, Zhang, Yang, Song, Li, Liu, Han, Wang, Li, Chen, Jia and Li</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Endogenous retroviruses (ERVs) originate from ancestral germline infections caused by exogenous retroviruses. Throughout evolution, they have become fixed within the genome of the animals into which they were integrated. As ERV elements coevolve with the host, they are normally epigenetically silenced and can become upregulated in a series of physiological and pathological processes. Generally, a detailed ERV profile in the host genome is critical for understanding the evolutionary history and functional performance of the host genome. We previously characterized and cataloged all the ERV-K subtype HML-8 loci in the human genome; however, this has not been done for the chimpanzee, the nearest living relative of humans. In this study, we aimed to catalog and characterize the integration of HML-8 in the chimpanzee genome and compare it with the integration of HML-8 in the human genome. We analyzed the integration of HML-8 and found that HML-8 pervasively invaded the chimpanzee genome. A total of 76 proviral elements were characterized on 23/24 chromosomes, including detailed element distribution, structure, phylogeny, integration time, and their potential to regulate adjacent genes. The incomplete structure of HML-8 proviral LTRs will undoubtedly affect their activity. Moreover, the results indicated that HML-8 integration occurred before the divergence between humans and chimpanzees. Furthermore, chimpanzees include more HML-8 proviral elements (76 vs. 40) and fewer solo long terminal repeats (LTR) (0 vs. 5) than humans. These results suggested that chimpanzee genome activity is lower than that of the human genome and that humans may have a better ability to shape and screen integrated proviral elements. Our work is informative in both an evolutionary and a functional context for ERVs.</p>
</abstract>
<kwd-group>
<kwd>endogenous retroviruses</kwd>
<kwd>chimpanzee</kwd>
<kwd>human</kwd>
<kwd>characterization</kwd>
<kwd>evolution</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="3"/>
<equation-count count="0"/>
<ref-count count="41"/>
<page-count count="19"/>
<word-count count="9894"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Virus and Host</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Endogenous retroviruses have played a role in primate evolution and result from exogenous retroviral infections, which integrate into the genome of the host germline and are subsequently inherited by the next generation (<xref ref-type="bibr" rid="B36">Stoye, 2012</xref>; <xref ref-type="bibr" rid="B31">Mager and Stoye, 2015</xref>; <xref ref-type="bibr" rid="B16">Jansz and Faulkner, 2021</xref>). ERVs can be found in all vertebrate genomes (<xref ref-type="bibr" rid="B36">Stoye, 2012</xref>; <xref ref-type="bibr" rid="B16">Jansz and Faulkner, 2021</xref>). For human endogenous retroviruses (HERVs), all residual components of HERVs have accounted for approximately 8% of the whole human genome (<xref ref-type="bibr" rid="B41">Venter et&#xa0;al., 2001</xref>; <xref ref-type="bibr" rid="B19">Jia et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B28">Liu et&#xa0;al., 2023</xref>). The proviral genome consists of a long terminal repeat (LTR) at both ends and four internal open reading frames. The LTRs at both ends contain functional regulatory elements, such as promoters, enhancers, and transcription factor-binding sites (<xref ref-type="bibr" rid="B1">Bannert and Kurth, 2004</xref>). The <italic>gag</italic> gene encodes structural proteins of the virus, including matrix (MA), capsid (CA), and nucleocapsid protein (NC). MA forms a layer on the inside of the viral envelope and plays an important role in virus assembly, as it forms a link or bridge between nucleocapsids/cores and the envelope. CA is the major structural component and plays a key role in the viral assembly and budding processes. NC is a small zinc finger protein that possesses nucleic acid chaperone activity that enables NC to rearrange DNA and RNA molecules into the most thermodynamically stable structures. The <italic>pro</italic> gene encodes a protease playing a central role in proteolytic processing. 
The <italic>pol</italic> gene encodes open reading frames for the proteins reverse transcriptase (RT) and integrase (IN). RT is responsible for converting RNA into complementary DNA, a key step in retrovirus replication. IN mediates the insertion of ERVs into the genome of the host cell. The <italic>env</italic> gene encodes surface and transmembrane proteins that participate in the assembly of retrovirus-like particles (<xref ref-type="bibr" rid="B32">Ono, 1986</xref>). Many of the coding regions of proviruses have lost the ability to encode functional proteins due to mutations, insertions, deletions, and rearrangements. In addition, the proviruses occasionally undergo homologous recombination between ancestral 5&#x2019; and 3&#x2019; proviral LTRs, where the intervening protein-coding sequence is deleted to form a separate solitary (or &#x201c;solo&#x201d;) LTR. It was reported that at least 85% of ERV cases are solitary (or &#x201c;solo&#x201d;) LTRs (<xref ref-type="bibr" rid="B25">Lander et&#xa0;al., 2001</xref>; <xref ref-type="bibr" rid="B31">Mager and Stoye, 2015</xref>). Surprisingly, there are few similarities between the LTRs of retroviruses from different genera (<xref ref-type="bibr" rid="B4">Benachenhou et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B20">Johnson, 2019</xref>).</p>
<p>There are many types of ERVs which can be classified according to their phylogenetic relationships. The three main categories are: Class I represents &#x3b3; retrovirus-like elements, Class II represents &#x3b2; retrovirus-like elements, and Class III represents spuma virus-like elements (<xref ref-type="bibr" rid="B40">Vargiu et&#xa0;al., 2016</xref>). The ERV-K group, which belongs to Class II, contains 11 subtypes, which are called Human MMTV Like, so they are named HML with a number (HML1-11). The ERV-K is the most studied group (<xref ref-type="bibr" rid="B3">Barbulescu et&#xa0;al., 1999</xref>). In addition to HML-2, HML-6, HML-7, HML-8, and HML-9 have also attracted the attention of many researchers (<xref ref-type="bibr" rid="B26">Lavie et&#xa0;al., 2004</xref>; <xref ref-type="bibr" rid="B8">Flockerzi et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B6">Broecker et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B35">Scognamiglio et&#xa0;al., 2022</xref>).</p>
<p>Most sequences of ERVs have been mutated and inactivated, but some ERVs can still be expressed and play important roles in some physiological processes. Studies have shown that ERV transcription occurs in healthy cells and tissues, including embryos and placentas (<xref ref-type="bibr" rid="B36">Stoye, 2012</xref>). In addition, aberrant expression of ERVs occurs in several diseases, such as multiple sclerosis and breast cancer, and their proteins may contribute to disease etiology (<xref ref-type="bibr" rid="B16">Jansz and Faulkner, 2021</xref>). It has been reported that HERV-K (HML-2) is a risk factor for multiple sclerosis (<xref ref-type="bibr" rid="B9">Garcia-Montojo et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B13">Holloway et&#xa0;al., 2019</xref>). In addition, the transcription level of ERV is increased in breast cancer, teratoma, ovarian tumor, and melanoma (<xref ref-type="bibr" rid="B9">Garcia-Montojo et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B20">Johnson, 2019</xref>; <xref ref-type="bibr" rid="B16">Jansz and Faulkner, 2021</xref>; <xref ref-type="bibr" rid="B7">Chen et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B19">Jia et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B28">Liu et&#xa0;al., 2023</xref>). In summary, although many ERVs have acquired mutations and are not actively expressed, there are ERV loci that continue to have important biological functions.</p>
<p>Therefore, considering the substantial contribution of ERVs to the host genome and their emerging roles in shaping the host&#x2019;s regulatory networks, exploring the dynamic expression and function of ERVs is important for understanding both human- and primate-specific aspects of gene regulation and development, including physiological and pathological processes (<xref ref-type="bibr" rid="B24">Kunarso et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B12">Grow et&#xa0;al., 2015</xref>). Before the dynamics of ERVs can be examined, it is essential to first determine the distribution and position of ERVs in the host genome. Many studies have focused on ERV elements in the human genome, but only a few have concentrated on these elements within the nonhuman primate genome. For chimpanzees, which are the closest living relative of humans, previous work revealed 45 HML-2 elements inserted specifically into the chimpanzee genome (<xref ref-type="bibr" rid="B29">Macfarlane and Badge, 2015</xref>). The results indicated that, compared with humans, the chimpanzee genome contains fewer chimpanzee-specific HML-2 integrations. In addition, little work has been done to characterize ERVs in chimpanzees and compare these with those of other primates, such as gorillas and humans (<xref ref-type="bibr" rid="B13">Holloway et&#xa0;al., 2019</xref>). Previously, we performed comprehensive identification and characterization of the ERV-K (HML-8) group in the human genome (<xref ref-type="bibr" rid="B28">Liu et&#xa0;al., 2023</xref>). However, the distribution and function of HML-8 elements in other primates, such as chimpanzees, remain unclear, and comparisons of the genomic distribution, integration time, and potential regulatory roles between the two hosts have not been performed. Chimpanzees are the closest living relative of human beings (<xref ref-type="bibr" rid="B2">Bannert and Kurth, 2006</xref>). 
Therefore, accurate and complete characterization of HML-8 elements in the chimpanzee genome is needed to compare the evolutionary forces underlying the 2 recent speciation patterns of mammalian groups. This work will facilitate the study of the existence, evolutionary relationship, and function of ERVs in primates, potentially helping to elucidate the pathogenesis of serious human diseases.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>HML-8 identification, localization, and genomic distribution</title>
<p>We used Jan. 2018 (Clint_PTRv2/panTro6) as the chimpanzee reference genome to determine the distribution of HML-8 remnants in the chimpanzee genome. The assembled MER11A-HERVK11-MER11A sequence from the Dfam database was used as a query for the HML-8 reference (<xref ref-type="bibr" rid="B14">Hubley et&#xa0;al., 2016</xref>) (<ext-link ext-link-type="uri" xlink:href="https://dfam.org/home">https://dfam.org/home</ext-link>). There are typically two resources for reference: consensus representatives and single best representatives. Compared to the single best representative, which is a specific and high-quality ERV sequence for HML-8, the consensus sequence for HML-8 has a much broader representation. Therefore, consensus representatives are used as references or queries in most studies (<xref ref-type="bibr" rid="B10">Grandi et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B33">Pisano et&#xa0;al., 2019</xref>). The BLAT search tool in the UCSC genome browser database was used to detect the integrated HML-8 elements (<xref ref-type="bibr" rid="B21">Kent, 2002</xref>; <xref ref-type="bibr" rid="B22">Kent et&#xa0;al., 2002</xref>). BLAT on DNA is designed to quickly find sequences of 95% and greater similarity of length 25 bases or more. BLAT functions in DNA alignment by keeping an index of the entire genome in its memory. The index consists of all overlapping 11-mers stepping by 5 except for those heavily involved in repeats (<ext-link ext-link-type="uri" xlink:href="http://genome.ucsc.edu/cgi-bin/hgBlat">http://genome.ucsc.edu/cgi-bin/hgBlat</ext-link>). 
Additionally, the expected distribution of HML-8 loci on each chromosome was calculated according to the Formula e=Cl &#xd7; N/Tl (e is the expected integration number in the chromosome, Cl represents the nongap length of the chromosome, N represents the total number of actual HML-8 loci identified in the chimpanzee genome, and Tl represents the total nongap length of all chromosomes) (<xref ref-type="bibr" rid="B11">Grandi et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B19">Jia et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B28">Liu et&#xa0;al., 2023</xref>). Chi-square (&#x3c7;<sup>2</sup>) tests were performed to analyze the difference between the expected integration number and the actual number of HML-8 loci and to estimate the statistical significance based on the <italic>p</italic> value.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Structural characterization</title>
<p>The length and structure of all the HML-8 provirus remnants were characterized via multiple alignments with the Dfam reference MER11A-HERVK11-MER11A performed with MEGA 7 and the BioEdit software platform (<xref ref-type="bibr" rid="B23">Kumar et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B38">Tamura et&#xa0;al., 2021</xref>). All the structural details, including insertions and deletions, were annotated.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Phylogenetic analyses</title>
<p>To confirm the assignment of the identified HML-8 elements in the chimpanzee genome, maximum likelihood (ML) phylogenetic trees were constructed using MEGA 7 (<xref ref-type="bibr" rid="B23">Kumar et&#xa0;al., 2016</xref>). Elements containing many gaps were eliminated manually. Three proviral sequences (longer than 80% of the HML-8 reference length) were screened to determine their phylogenetic relationships. Using the model selection function in MEGA7, the best-fit model of nucleotide substitution for these near full-length proviruses was the general time reversible model with a gamma distribution and invariant sites (GTR+G+I). Additionally, elements longer than 90% of the corresponding 4 coding regions of HML-8 were screened to construct subregion phylogenetic trees, respectively. Based on the model selection function in MEGA7, the most suitable nucleotide substitution models for <italic>gag</italic>, <italic>pro</italic>, <italic>pol</italic> and <italic>env</italic> analysis are as follows: the Hasegawa-Kishino-Yano model with a gamma distribution and invariant sites (HKY+G+I); the general time reversible model with a gamma distribution and invariant sites (GTR+G+I); the general time reversible model with a gamma distribution (GTR+G); and the Hasegawa-Kishino-Yano model with a gamma distribution (HKY+G). The nearest neighbor interchange (NNI) procedure was used to search for the tree topology. The nearest neighbor interchange is a heuristic search to improve the likelihood of a tree by performing the following operation on it. If we have two unrooted trees, then we can specify a neighbor relation between the two of them and then swap their subtrees in an attempt to obtain a tree that has a higher likelihood (<ext-link ext-link-type="uri" xlink:href="https://www.megasoftware.net/webhelp/centraldialogbox_hc/nearest_neighbor_interchange_nni_.htm">https://www.megasoftware.net/webhelp/centraldialogbox_hc/nearest_neighbor_interchange_nni_.htm</ext-link>). 
The confidence of each node in the phylogenetic trees was determined using the bootstrap test with 500 bootstrap replicates. The final trees were visualized by iTOL (<xref ref-type="bibr" rid="B38">Tamura et&#xa0;al., 2021</xref>).</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Estimation of the integration time of HML-8 members in the chimpanzee genome</title>
<p>To estimate the integration time of each HML-8 element in the chimpanzee genome, we used a substitution rate of 0.2%/nucleotide/million years to evaluate the divergence effect on every HML-8 (<xref ref-type="bibr" rid="B27">Lebedev et&#xa0;al., 2000</xref>). For the 4 internal regions (<italic>gag</italic>, <italic>pro</italic>, <italic>pol</italic>, and <italic>env</italic>), the integration time was calculated based on the Formula T&#x2009;=&#x2009;D/0.2. For the flanking LTR regions, the integration time was calculated based on the Formula T&#x2009;=&#x2009;D/0.2/2. T represents the estimated time of integration (in million years). D represents the percentage of divergent nucleotides, and the D of each HML-8 element was estimated in two ways: (1) between the 5&#x2019; and 3&#x2019; LTRs of each provirus and (2) between each HML-8 internal element and its consensus generated. The divergence values were calculated with MEGA7.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Functional prediction of cis-regulatory regions and enrichment analysis</title>
<p>The noncoding LTR regions of HML-8 lack biological function annotations in the chimpanzee genome. To understand the biological significance of the HML-8 proviral LTRs, we performed functional prediction and enrichment analysis of the cis-regulatory regions of these chimpanzee HML-8 elements. Based on the Genomic Regions Enrichment of Annotations Tool (GREAT), gene annotations near HML-8 proviral LTRs were analyzed. The association rules were as follows: basal + extension, 5000 bp upstream, 1000 bp downstream, and 1000000 bp maximum extension; curated regulatory domains were included. When the potential regulatory genes were identified, the WEB-based Gene SeT Analysis Toolkit (WebGestalt) was subsequently used to analyze their functional enrichment (<ext-link ext-link-type="uri" xlink:href="http://www.webgestalt.org">http://www.webgestalt.org</ext-link>). This approach is crucial for interpreting the list of genes of interest. The enrichment method used here was overrepresentation analysis (ORA). The parameters for the enrichment analysis included the following: minimum number of IDs in the category: 5; maximum number of IDs in the category: 2000; FDR Method: Benjamini&#x2013;Hochberg (BH); and significance level: top 10.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Identification, localization, and distribution of HML-8 remnants in the chimpanzee genome [Jan.2018 (Clint_PTRv2/panTro6)]</title>
<p>The results showed that HML-8 elements pervasively invaded the chimpanzee genome. According to the BLAT results obtained for MER11A-HERVK11-MER11A in Jan. 2018 (Clint_PTRv2/panTro6), we identified a total of 76 HML-8 proviral elements (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>), as compared to the 40 proviral elements we identified in the human genome (<xref ref-type="bibr" rid="B28">Liu et&#xa0;al., 2023</xref>). Based on the integrated genomic loci, each HML-8 element was named according to the nomenclature previously proposed for HERV-K elements (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>) (<xref ref-type="bibr" rid="B37">Subramanian et&#xa0;al., 2011</xref>). First, we observed a notable feature: there was no complete full-length element of HML-8 in the chimpanzee genome. The longest proviral element was 9158 bp long, which accounted for 84.7% of the reference sequence. The length analysis revealed that the average length of these proviral elements was 4378 bp, with 9 elements being greater than 70% of the reference length, 21 elements being between 40 and 70% of the reference length, and the remaining 46 elements being between 8.14 and 37.49% (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). Among them, the shortest proviral element was 875 bp long, which accounted for only 8.14% of the reference sequence. The longest and shortest HML-8 proviral elements in the human genome are 9162 and 874 bp long, respectively. This similarity suggested that the integration events of HML-8 simultaneously occurred before the divergence between humans and chimpanzees.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>HML-8 provirus distribution.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Number</th>
<th valign="middle" align="center">Chromosome</th>
<th valign="middle" align="center">Strand</th>
<th valign="middle" align="center">Position start</th>
<th valign="middle" align="center">Position end</th>
<th valign="middle" align="center">Length (bp)</th>
<th valign="middle" align="center">Match+mismatch(bp)/full length(bp)</th>
<th valign="middle" align="center">Range</th>
<th valign="middle" align="center">Qgap(bp)/match+mismatch+Qgap(bp)</th>
<th valign="middle" align="center">Insertion or deletion</th>
<th valign="top" align="center">Intergenic/intron/exon</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">1</td>
<td valign="top" align="center">chr11</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">97063674</td>
<td valign="top" align="center">97072831</td>
<td valign="top" align="center">9158</td>
<td valign="top" align="center">84.70%</td>
<td valign="top" align="center">&#x3010;80%-90%)</td>
<td valign="top" align="center">3.28%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">2</td>
<td valign="top" align="center">chr19</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">23582963</td>
<td valign="top" align="center">23597406</td>
<td valign="top" align="center">14444</td>
<td valign="top" align="center">81.45%</td>
<td valign="top" align="center">&#x3010;80%-90%)</td>
<td valign="top" align="center">5.78%</td>
<td valign="top" align="center">Insertion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">3</td>
<td valign="top" align="center">chr17</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">28556159</td>
<td valign="top" align="center">28565079</td>
<td valign="top" align="center">8921</td>
<td valign="top" align="center">81.22%</td>
<td valign="top" align="center">&#x3010;80%-90%)</td>
<td valign="top" align="center">9.29%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">4</td>
<td valign="top" align="center">chr1</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">156345936</td>
<td valign="top" align="center">156354251</td>
<td valign="top" align="center">8316</td>
<td valign="top" align="center">76.67%</td>
<td valign="top" align="center">&#x3010;70%-80%)</td>
<td valign="top" align="center">12.10%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">5</td>
<td valign="top" align="center">chr9</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">31695596</td>
<td valign="top" align="center">31703805</td>
<td valign="top" align="center">8210</td>
<td valign="top" align="center">76.57%</td>
<td valign="top" align="center">&#x3010;70%-80%)</td>
<td valign="top" align="center">2.80%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">6</td>
<td valign="top" align="center">chr5</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">52655093</td>
<td valign="top" align="center">52662923</td>
<td valign="top" align="center">7831</td>
<td valign="top" align="center">73.29%</td>
<td valign="top" align="center">&#x3010;70%-80%)</td>
<td valign="top" align="center">4.76%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">7</td>
<td valign="top" align="center">chr19</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">25615095</td>
<td valign="top" align="center">25622844</td>
<td valign="top" align="center">7750</td>
<td valign="top" align="center">71.85%</td>
<td valign="top" align="center">&#x3010;70%-80%)</td>
<td valign="top" align="center">6.43%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">8</td>
<td valign="top" align="center">chr12</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">51714625</td>
<td valign="top" align="center">51722440</td>
<td valign="top" align="center">7816</td>
<td valign="top" align="center">70.94%</td>
<td valign="top" align="center">&#x3010;70%-80%)</td>
<td valign="top" align="center">7.63%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">9</td>
<td valign="top" align="center">chr6</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">73941843</td>
<td valign="top" align="center">73949302</td>
<td valign="top" align="center">7460</td>
<td valign="top" align="center">70.49%</td>
<td valign="top" align="center">&#x3010;70%-80%)</td>
<td valign="top" align="center">4.11%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">10</td>
<td valign="top" align="center">chr9</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">84591713</td>
<td valign="top" align="center">84599232</td>
<td valign="top" align="center">7520</td>
<td valign="top" align="center">69.51%</td>
<td valign="top" align="center">&#x3010;60%-70%)</td>
<td valign="top" align="center">24.21%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">11</td>
<td valign="top" align="center">chr3</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">79615035</td>
<td valign="top" align="center">79622061</td>
<td valign="top" align="center">7027</td>
<td valign="top" align="center">64.57%</td>
<td valign="top" align="center">&#x3010;60%-70%)</td>
<td valign="top" align="center">17.82%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">12</td>
<td valign="top" align="center">chrX</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">56602551</td>
<td valign="top" align="center">56609242</td>
<td valign="top" align="center">6692</td>
<td valign="top" align="center">63.26%</td>
<td valign="top" align="center">&#x3010;60%-70%)</td>
<td valign="top" align="center">4.37%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">13</td>
<td valign="top" align="center">chr1</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">135696367</td>
<td valign="top" align="center">135712562</td>
<td valign="top" align="center">16196</td>
<td valign="top" align="center">61.48%</td>
<td valign="top" align="center">&#x3010;60%-70%)</td>
<td valign="top" align="center">6.97%</td>
<td valign="top" align="center">Insertion</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">14</td>
<td valign="top" align="center">chr11</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">63656712</td>
<td valign="top" align="center">63663509</td>
<td valign="top" align="center">6798</td>
<td valign="top" align="center">59.90%</td>
<td valign="top" align="center">&#x3010;50%-60%)</td>
<td valign="top" align="center">31.36%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">15</td>
<td valign="top" align="center">chr2A</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">64123614</td>
<td valign="top" align="center">64129736</td>
<td valign="top" align="center">6123</td>
<td valign="top" align="center">57.81%</td>
<td valign="top" align="center">&#x3010;50%-60%)</td>
<td valign="top" align="center">20.10%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">16</td>
<td valign="top" align="center">chr3</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">128565266</td>
<td valign="top" align="center">128571536</td>
<td valign="top" align="center">6271</td>
<td valign="top" align="center">57.64%</td>
<td valign="top" align="center">&#x3010;50%-60%)</td>
<td valign="top" align="center">25.16%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">17</td>
<td valign="top" align="center">chr12</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">81696811</td>
<td valign="top" align="center">81702819</td>
<td valign="top" align="center">6009</td>
<td valign="top" align="center">56.24%</td>
<td valign="top" align="center">&#x3010;50%-60%)</td>
<td valign="top" align="center">13.24%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">18</td>
<td valign="top" align="center">chr11</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">49590235</td>
<td valign="top" align="center">49596119</td>
<td valign="top" align="center">5885</td>
<td valign="top" align="center">54.38%</td>
<td valign="top" align="center">&#x3010;50%-60%)</td>
<td valign="top" align="center">5.42%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">19</td>
<td valign="top" align="center">chr10</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">98677603</td>
<td valign="top" align="center">98683109</td>
<td valign="top" align="center">5507</td>
<td valign="top" align="center">50.71%</td>
<td valign="top" align="center">&#x3010;50%-60%)</td>
<td valign="top" align="center">37.81%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">genic&amp;intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">20</td>
<td valign="top" align="center">chr1</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">108430301</td>
<td valign="top" align="center">108435591</td>
<td valign="top" align="center">5291</td>
<td valign="top" align="center">49.26%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">32.31%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">21</td>
<td valign="top" align="center">chrY</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">23381750</td>
<td valign="top" align="center">23386956</td>
<td valign="top" align="center">5207</td>
<td valign="top" align="center">48.45%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">31.40%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">22</td>
<td valign="top" align="center">chr11</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">50352478</td>
<td valign="top" align="center">50357771</td>
<td valign="top" align="center">5294</td>
<td valign="top" align="center">48.21%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">9.03%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">23</td>
<td valign="top" align="center">chr11</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">49637737</td>
<td valign="top" align="center">49642530</td>
<td valign="top" align="center">4794</td>
<td valign="top" align="center">43.57%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">35.29%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">24</td>
<td valign="top" align="center">chr4</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">137449286</td>
<td valign="top" align="center">137454131</td>
<td valign="top" align="center">4846</td>
<td valign="top" align="center">42.39%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">45.12%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">25</td>
<td valign="top" align="center">chr12</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">102968149</td>
<td valign="top" align="center">102972730</td>
<td valign="top" align="center">4582</td>
<td valign="top" align="center">42.14%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">8.05%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">26</td>
<td valign="top" align="center">chr3</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">109740319</td>
<td valign="top" align="center">109744759</td>
<td valign="top" align="center">4441</td>
<td valign="top" align="center">41.74%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">30.22%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">27</td>
<td valign="top" align="center">chr11</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">14869711</td>
<td valign="top" align="center">14874159</td>
<td valign="top" align="center">4449</td>
<td valign="top" align="center">41.19%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">26.33%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">28</td>
<td valign="top" align="center">chr4</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">64843173</td>
<td valign="top" align="center">64847502</td>
<td valign="top" align="center">4330</td>
<td valign="top" align="center">40.68%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">3.57%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">29</td>
<td valign="top" align="center">chrX</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">34789238</td>
<td valign="top" align="center">34793597</td>
<td valign="top" align="center">4360</td>
<td valign="top" align="center">40.26%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">24.69%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">30</td>
<td valign="top" align="center">chr8</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">44511870</td>
<td valign="top" align="center">44516437</td>
<td valign="top" align="center">4568</td>
<td valign="top" align="center">40.01%</td>
<td valign="top" align="center">&#x3010;40%-50%)</td>
<td valign="top" align="center">7.33%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">31</td>
<td valign="top" align="center">chr6</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">155777868</td>
<td valign="top" align="center">155781847</td>
<td valign="top" align="center">3980</td>
<td valign="top" align="center">37.49%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">1.50%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">exonic&amp;intronic</td>
</tr>
<tr>
<td valign="middle" align="left">32</td>
<td valign="top" align="center">chr19</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">24073629</td>
<td valign="top" align="center">24078094</td>
<td valign="top" align="center">4466</td>
<td valign="top" align="center">36.96%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">4.79%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">33</td>
<td valign="top" align="center">chr4</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">77803811</td>
<td valign="top" align="center">77807756</td>
<td valign="top" align="center">3946</td>
<td valign="top" align="center">36.44%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">34.61%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">34</td>
<td valign="top" align="center">chr8</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">12333790</td>
<td valign="top" align="center">12337817</td>
<td valign="top" align="center">4028</td>
<td valign="top" align="center">36.18%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">27.03%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">35</td>
<td valign="top" align="center">chr7</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">6075204</td>
<td valign="top" align="center">6079128</td>
<td valign="top" align="center">3925</td>
<td valign="top" align="center">35.29%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">28.35%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">36</td>
<td valign="top" align="center">chr8</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">43749874</td>
<td valign="top" align="center">43753733</td>
<td valign="top" align="center">3860</td>
<td valign="top" align="center">34.71%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">38.35%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">37</td>
<td valign="top" align="center">chrY</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">6360429</td>
<td valign="top" align="center">6370254</td>
<td valign="top" align="center">9826</td>
<td valign="top" align="center">34.32%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">38.19%</td>
<td valign="top" align="center">Insertion,Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">38</td>
<td valign="top" align="center">chr8</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">86619640</td>
<td valign="top" align="center">86623356</td>
<td valign="top" align="center">3717</td>
<td valign="top" align="center">34.09%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">34.77%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">39</td>
<td valign="top" align="center">chr20</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">29240803</td>
<td valign="top" align="center">29250628</td>
<td valign="top" align="center">9826</td>
<td valign="top" align="center">34.03%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">38.72%</td>
<td valign="top" align="center">Insertion,Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">40</td>
<td valign="top" align="center">chr4</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">77195305</td>
<td valign="top" align="center">77198763</td>
<td valign="top" align="center">3459</td>
<td valign="top" align="center">32.47%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">4.25%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">41</td>
<td valign="top" align="center">chr2A</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">102337670</td>
<td valign="top" align="center">102341003</td>
<td valign="top" align="center">3334</td>
<td valign="top" align="center">31.08%</td>
<td valign="top" align="center">&#x3010;30%-40%)</td>
<td valign="top" align="center">11.22%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">42</td>
<td valign="top" align="center">chr5</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">150548523</td>
<td valign="top" align="center">150551566</td>
<td valign="top" align="center">3044</td>
<td valign="top" align="center">28.84%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">28.68%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">43</td>
<td valign="top" align="center">chr7</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">50863865</td>
<td valign="top" align="center">50867270</td>
<td valign="top" align="center">3406</td>
<td valign="top" align="center">27.87%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">28.99%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">44</td>
<td valign="top" align="center">chr1</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">45743923</td>
<td valign="top" align="center">45746943</td>
<td valign="top" align="center">3021</td>
<td valign="top" align="center">27.13%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">10.68%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">45</td>
<td valign="top" align="center">chrX</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">41627863</td>
<td valign="top" align="center">41630750</td>
<td valign="top" align="center">2888</td>
<td valign="top" align="center">26.01%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">13.10%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">46</td>
<td valign="top" align="center">chrX</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">42154219</td>
<td valign="top" align="center">42156882</td>
<td valign="top" align="center">2664</td>
<td valign="top" align="center">24.40%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">13.70%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">47</td>
<td valign="top" align="center">chr22</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">1446161</td>
<td valign="top" align="center">1448721</td>
<td valign="top" align="center">2561</td>
<td valign="top" align="center">23.70%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">1.58%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">48</td>
<td valign="top" align="center">chr16</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">44723847</td>
<td valign="top" align="center">44726410</td>
<td valign="top" align="center">2564</td>
<td valign="top" align="center">23.53%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">11.83%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">49</td>
<td valign="top" align="center">chrY</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">3095532</td>
<td valign="top" align="center">3098114</td>
<td valign="top" align="center">2583</td>
<td valign="top" align="center">23.20%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">14.79%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">50</td>
<td valign="top" align="center">chrY</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">13438427</td>
<td valign="top" align="center">13440964</td>
<td valign="top" align="center">2538</td>
<td valign="top" align="center">23.15%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">13.88%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">51</td>
<td valign="top" align="center">chr19</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">20847619</td>
<td valign="top" align="center">20850034</td>
<td valign="top" align="center">2416</td>
<td valign="top" align="center">22.88%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">2.80%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">52</td>
<td valign="top" align="center">chr8</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">11324731</td>
<td valign="top" align="center">11327317</td>
<td valign="top" align="center">2587</td>
<td valign="top" align="center">22.77%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">15.32%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">53</td>
<td valign="top" align="center">chr1</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">31825639</td>
<td valign="top" align="center">31827932</td>
<td valign="top" align="center">2294</td>
<td valign="top" align="center">21.66%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">44.57%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">54</td>
<td valign="top" align="center">chr2B</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">5807936</td>
<td valign="top" align="center">5810201</td>
<td valign="top" align="center">2266</td>
<td valign="top" align="center">21.54%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">5.44%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">55</td>
<td valign="top" align="center">chr4</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">49398166</td>
<td valign="top" align="center">49400489</td>
<td valign="top" align="center">2324</td>
<td valign="top" align="center">21.00%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">14.29%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">56</td>
<td valign="top" align="center">chr15</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">19096168</td>
<td valign="top" align="center">19099630</td>
<td valign="top" align="center">3463</td>
<td valign="top" align="center">20.90%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">21.64%</td>
<td valign="top" align="center">Insertion,Deletion</td>
<td valign="top" align="center">genic&amp;intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">57</td>
<td valign="top" align="center">chr4</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">162706670</td>
<td valign="top" align="center">162708848</td>
<td valign="top" align="center">2179</td>
<td valign="top" align="center">20.70%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">5.49%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">58</td>
<td valign="top" align="center">chr2B</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">100074966</td>
<td valign="top" align="center">100077139</td>
<td valign="top" align="center">2174</td>
<td valign="top" align="center">20.56%</td>
<td valign="top" align="center">&#x3010;20%-30%)</td>
<td valign="top" align="center">5.31%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">59</td>
<td valign="top" align="center">chr18</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">44459897</td>
<td valign="top" align="center">44461968</td>
<td valign="top" align="center">2072</td>
<td valign="top" align="center">19.48%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">0.54%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">60</td>
<td valign="top" align="center">chr19</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">25500990</td>
<td valign="top" align="center">25503068</td>
<td valign="top" align="center">2079</td>
<td valign="top" align="center">19.47%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">2.58%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">61</td>
<td valign="top" align="center">chr14</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">71784651</td>
<td valign="top" align="center">71786596</td>
<td valign="top" align="center">1946</td>
<td valign="top" align="center">18.45%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">8.25%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">62</td>
<td valign="top" align="center">chr4</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">55246241</td>
<td valign="top" align="center">55248103</td>
<td valign="top" align="center">1863</td>
<td valign="top" align="center">17.68%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">10.87%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">63</td>
<td valign="top" align="center">chr6</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">58293089</td>
<td valign="top" align="center">58294835</td>
<td valign="top" align="center">1747</td>
<td valign="top" align="center">16.57%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">0.63%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">64</td>
<td valign="top" align="center">chr13</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">59301174</td>
<td valign="top" align="center">59302916</td>
<td valign="top" align="center">1743</td>
<td valign="top" align="center">16.29%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">6.77%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">65</td>
<td valign="top" align="center">chr11</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">49783110</td>
<td valign="top" align="center">49784802</td>
<td valign="top" align="center">1693</td>
<td valign="top" align="center">15.89%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">2.00%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">66</td>
<td valign="top" align="center">chr2A</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">77283713</td>
<td valign="top" align="center">77285331</td>
<td valign="top" align="center">1619</td>
<td valign="top" align="center">15.17%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">1.55%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">67</td>
<td valign="top" align="center">chr2B</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">97034956</td>
<td valign="top" align="center">97036587</td>
<td valign="top" align="center">1632</td>
<td valign="top" align="center">15.12%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">14.74%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">68</td>
<td valign="top" align="center">chr5_NW_019932883v1_random</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">1485086</td>
<td valign="top" align="center">1486708</td>
<td valign="top" align="center">1623</td>
<td valign="top" align="center">14.83%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">17.16%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">69</td>
<td valign="top" align="center">chr4</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">50892584</td>
<td valign="top" align="center">50893971</td>
<td valign="top" align="center">1388</td>
<td valign="top" align="center">12.91%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">15.64%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intron</td>
</tr>
<tr>
<td valign="middle" align="left">70</td>
<td valign="top" align="center">chrY</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">14091617</td>
<td valign="top" align="center">14092838</td>
<td valign="top" align="center">1222</td>
<td valign="top" align="center">11.28%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">4.13%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">71</td>
<td valign="top" align="center">chrY</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">5451943</td>
<td valign="top" align="center">5453164</td>
<td valign="top" align="center">1222</td>
<td valign="top" align="center">11.28%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">4.13%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">72</td>
<td valign="top" align="center">chrX</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">46463406</td>
<td valign="top" align="center">46464551</td>
<td valign="top" align="center">1146</td>
<td valign="top" align="center">10.90%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">16.33%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">73</td>
<td valign="top" align="center">chrY</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">1087726</td>
<td valign="top" align="center">1088806</td>
<td valign="top" align="center">1081</td>
<td valign="top" align="center">10.28%</td>
<td valign="top" align="center">&#x3010;10%-20%)</td>
<td valign="top" align="center">0.83%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">74</td>
<td valign="top" align="center">chr5</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">32949251</td>
<td valign="top" align="center">32950412</td>
<td valign="top" align="center">1162</td>
<td valign="top" align="center">9.90%</td>
<td valign="top" align="center">&#x3010;0%-10%)</td>
<td valign="top" align="center">11.51%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">75</td>
<td valign="top" align="center">chr10</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">77164804</td>
<td valign="top" align="center">77165954</td>
<td valign="top" align="center">1151</td>
<td valign="top" align="center">9.65%</td>
<td valign="top" align="center">&#x3010;0%-10%)</td>
<td valign="top" align="center">13.06%</td>
<td valign="top" align="center">Deletion</td>
<td valign="top" align="center">intergenic</td>
</tr>
<tr>
<td valign="middle" align="left">76</td>
<td valign="top" align="center">chr1</td>
<td valign="top" align="center">+</td>
<td valign="top" align="center">104828192</td>
<td valign="top" align="center">104829066</td>
<td valign="top" align="center">875</td>
<td valign="top" align="center">8.14%</td>
<td valign="top" align="center">&#x3010;0%-10%)</td>
<td valign="top" align="center">2.18%</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">intergenic</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>&#x201c;&#x2013;&#x201d; indicates the antisense strand, &#x201c;+&#x201d; represents the sense strand, and &#x201c;NA&#x201d; stands for Not Applicable.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>We did not find any solo HML-8 LTRs in the chimpanzee genome, which is distinct from our findings in the human genome, where there were 5 solo HML-8 LTRs. Although short (approximately 75% of the representative reference MER11A), these 5 solo LTRs exist in the human genome. The nucleotide sequence of each proviral element is shown in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Dataset 1</bold>
</xref>. The underlying distribution of HML-8 elements in the chimpanzee genome is shown in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Chromosomal distribution of the HML-8 loci in the chimpanzee genome. <bold>(A)</bold> All the HML-8 elements (red arrows) are displayed on the chimpanzee karyotype (<uri xlink:href="http://www.ensembl.org">http://www.ensembl.org</uri>). <bold>(B)</bold> The number of HML-8 proviral elements integrated into each chimpanzee chromosome was determined and compared to the expected number of insertion events. The expected number of sequences in each chromosome is marked in blue, and the actual number of detected sequences is marked in orange.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-14-1349046-g001.tif"/>
</fig>
<p>Furthermore, the expected number of HML-8 proviral elements in each chimpanzee chromosome was predicted. The expected number of HML-8 loci was subsequently compared with the actual number of HML-8 loci detected on each chimpanzee chromosome to evaluate whether HML-8 was randomly distributed in the chimpanzee genome. The results indicated that the number of observed HML-8 distribution events was significantly inconsistent with what was expected, thus supporting the nonrandom integration of HML-8 in the genome (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>). For proviral elements, the number of HML-8 insertions on chromosomes 4, 11, 19, and Y was greater than expected. In particular, the number of HML-8 proviral elements on the Y chromosome was 12 times greater than expected. In contrast, on chromosomes 3, 6, 7, 9, 10, 13, 14, 15, 16, 17, 18 and 20, the number of HML-8 locus integrations was lower than expected. Notably, we did not detect any HML-8 proviral integrations on chromosome 21 (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>). The analysis clearly showed that the integration of HML-8 into the chimpanzee genome was nonrandom. Furthermore, all 76 identified proviral elements were analyzed to determine their locations in intergenic regions, introns, or exons. The results showed that 59 proviral elements were located in intergenic regions, accounting for 77.63%; 14 proviral elements were located in introns, accounting for 18.42%; and 2 proviral elements were located in both genic and intergenic regions, accounting for 2.63% (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). Brady et&#xa0;al. previously validated that the accumulation of HML-2 proviruses in introns and intergenic regions is a selection against proviruses that integrate into exons and genic regions rather than a result of integration preference (<xref ref-type="bibr" rid="B5">Brady et&#xa0;al., 2009</xref>). Our study similarly revealed a nonrandom distribution and apparent bias for insertions into intergenic regions and introns.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Structural characterization</title>
<p>The analysis of the structural features of all 76 HML-8 proviruses, such as deletion and insertion events, can characterize the uniqueness of each proviral element and assess the potential for active expression. Thus, to define the structural characteristics of HML-8, the 76 proviral elements were first compared to the complete HML-8 reference (MER11A-HERVK11-MER11A). According to the annotation information in the Dfam database (<ext-link ext-link-type="uri" xlink:href="https://www.dfam.org/family/DF0000193/features">https://www.dfam.org/family/DF0000193/features</ext-link>), the complete HML-8 reference exhibited a typical proviral structure containing 4 open reading frames (ORFs) and 2 flanking LTRs. Specifically, the 5&#x2019; LTR is located between nucleotides 1-1266, the coding sequence (CDS) range of the HERVK11 <italic>gag</italic> protein is from nucleotides 1422-3530, the CDS range of the HERVK11 <italic>pro</italic> protein is from nucleotides 3341-4345, the CDS range of the HERVK11 <italic>pol</italic> protein is from nucleotides 4303-7032, the CDS range of the HERVK11 <italic>env</italic> protein is from nucleotides 6890-9217, and the 3&#x2019; LTR is located between nucleotides 9220-10485.</p>
<p>All 76 HML-8 proviral sequences were aligned, and the positions of the insertions and deletions were annotated to describe the structure of each HML-8 provirus element (<xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2</bold>
</xref>, <xref ref-type="fig" rid="f3">
<bold>3</bold>
</xref>). We grouped HML-8 proviral loci based on their alignment to the consensus sequence. We found that all HML-8 loci in the chimpanzee genome were incomplete and lacked either some part of an LTR, internal coding sequences, or both. Among them, only 9 elements, namely HML-8 chr11:97063674-97072831, chr19:23582963-23597406, chr17:28556159-28565079, chr1:156345936-156354251, chr9:31695596-31703805, chr5:52655093-52662923, chr19:25615095-25622844, chr12:51714625-51722440, and chr6:73941843-73949302, were longer than 70% of the length of the complete reference sequence and showed the typical proviral structure (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Structural characterization of HML-8 proviral elements 1-38. The first 38 HML-8 provirus elements (1-38) were analyzed and compared with the Dfam reference sequence. All insertions and deletions have been annotated, as reported in the figure legend. The way the loci were grouped depended on the range of their sequence match to the consensus sequence.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-14-1349046-g002.tif"/>
</fig>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Structural characterization of HML-8 proviral elements 39-76. The remaining HML-8 provirus elements (39-76) were analyzed and compared with the Dfam reference sequence. All insertions and deletions have been annotated, as reported in the figure legend. The way the loci were grouped depended on the range of their sequence match to the consensus sequence.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-14-1349046-g003.tif"/>
</fig>
<p>Additionally, <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref> summarizes the integrity of the 6 separate regions relative to the corresponding sections of the HML-8 reference sequence (5&#x2019; LTR, <italic>gag</italic>, <italic>pro</italic>, <italic>pol</italic>, <italic>env</italic>, and 3&#x2019; LTR), respectively. The results showed that among all 76 proviral elements, the 5&#x2019; LTR regions of 63 were missing. The longest 5&#x2019; LTR included 1023 base pairs out of 1266 base pairs (80.81%) relative to the corresponding reference region. The shortest 5&#x2019; LTR included 179 base pairs out of 1266 base pairs (14.14%). The remaining 11 5&#x2019; LTRs ranged from 33.49%-76.54% (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). The 5&#x2019; LTR plays a crucial role in virus transcription and replication. Due to the truncation of the HML-8 proviral LTR sequences, it is unlikely these proviruses are actively expressed or able to retrotranspose into new locations in the chimpanzee genome. Among all 76 proviral elements, 43 <italic>gag</italic> regions have been deleted. The shortest <italic>gag</italic> gene accounted for 0.52%. The 15 <italic>gag</italic> loci ranged from 90.04%-99.72%. The remaining 17 <italic>gag</italic> loci ranged from 5.22%-86.58% (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). Among all 76 proviral elements, 34 <italic>pro</italic> regions have been deleted. The shortest <italic>pro</italic> gene accounted for 3.28%. The 17 <italic>pro</italic> loci ranged from 91.84%-99.90%. The remaining 22 <italic>pro</italic> loci ranged from 7.06%-88.06% (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). Among all 76 proviral elements, 19 <italic>pol</italic> regions have been deleted. The shortest <italic>pol</italic> gene accounted for 2.67%. The 15 <italic>pol</italic> loci ranged from 92.89%-99.82%. The remaining 41 <italic>pol</italic> loci ranged from 5.13%-78.46%. Among all 76 proviral elements, 11 <italic>env</italic> regions have been deleted. The shortest <italic>env</italic> gene accounted for 0.09%. The 33 <italic>env</italic> loci ranged from 90.21%-99.70%. The remaining 31 <italic>env</italic> loci ranged from 13.57%-89.99%. Among all 76 proviral elements, 25 3&#x2019; LTR regions have been deleted. The longest 3&#x2019; LTR element accounted for 41.47%. The shortest 3&#x2019; LTR element accounted for 3.40%. The remaining 49 3&#x2019; LTR loci ranged from 6.32%-40.84%. In summary, 63 5&#x2019; LTRs, 43 <italic>gag</italic> regions, 34 <italic>pro</italic> regions, 19 <italic>pol</italic> regions, 11 <italic>env</italic> regions, and 25 3&#x2019; LTR regions have been completely deleted. The loss of the 5&#x2019; LTR was the most severe and was much greater than that of the 3&#x2019; LTR. The 5&#x2019; LTR plays a crucial role in the transcription and replication of viruses. Therefore, the consistent truncation of the HML-8 5&#x2019; LTRs likely significantly impedes their expression and retrotransposition activity in the chimpanzee genome. In contrast, the <italic>env</italic> region has the smallest degree of absence. Only 11 have been deleted. Forty-four out of the 76 <italic>env</italic> regions accounted for &#x2265;70.75%. Interestingly, a similar situation was also observed in the human genome, suggesting that HML-8 was integrated before the divergence of human and chimpanzee ancestors. In the human genome, among all 40 proviral elements, 28 5&#x2019; LTR regions have been deleted. The longest 5&#x2019; LTR accounted for 73.93% of the total length relative to the corresponding reference region. 
The shortest 5&#x2019; LTR accounted for 28.2%. The remaining 10 5&#x2019; LTRs ranged from 32.94%-73.14%. Among all 40 proviral elements, the <italic>gag</italic> regions of 17 have been deleted. The shortest <italic>gag</italic> accounted for 39.02%. The 12 <italic>gag</italic> regions ranged from 92.89%-99.95%. The remaining 10 <italic>gag</italic> regions ranged from 49.64%-81.41%. Among all 40 proviral elements, the <italic>pro</italic> region of 12 was deleted. There were 3 complete <italic>pro</italic> regions. The shortest <italic>pro</italic> accounted for 8.06%. The 12 <italic>pro</italic> regions ranged from 94.93%-99.5%. The remaining 12 ranged from 13.23%-88.46%. Among all 40 proviral elements, the <italic>pol</italic> region of 6 was deleted. The shortest <italic>pol</italic> accounted for 6.7%. The 10 <italic>pol</italic> regions ranged from 93.33%-99.89%. The remaining 23 <italic>pol</italic> regions ranged from 10.29%-78.35%. Among all 40 proviral elements, the <italic>env</italic> region of 6 has been deleted. The shortest <italic>env</italic> gene accounted for 13.57%. The 15 <italic>env</italic> loci ranged from 90.16%-99.05%. The remaining 18 <italic>env</italic> loci ranged from 30.07%-89.73%. Among all 40 proviral elements, the 3&#x2019; LTR region of 16 was missing. The longest 3&#x2019; LTR accounted for 75.36%. The shortest 3&#x2019; LTR accounted for 8.93%. The remaining 22 3&#x2019; LTRs ranged from 9.64%-44.71%. In summary, 28 5&#x2019; LTR regions, 17 <italic>gag</italic> regions, 12 <italic>pro</italic> regions, 6 <italic>pol</italic> regions, 6 <italic>env</italic> regions, and 16 3&#x2019; LTR regions were completely missing.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>The integrity of the 6 separate regions relative to the corresponding sections of the HML-8 reference sequence.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Number</th>
<th valign="top" align="center">Provirus Regions</th>
<th valign="top" align="center">5&#x2019;LTR(%)</th>
<th valign="top" align="center">gag(%)</th>
<th valign="top" align="center">pro(%)</th>
<th valign="top" align="center">pol(%)</th>
<th valign="top" align="center">env(%)</th>
<th valign="top" align="center">3&#x2019;LTR(%)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="center">chr11 97063674 97072831</td>
<td valign="top" align="center">48.66%</td>
<td valign="top" align="center">99.67%</td>
<td valign="top" align="center">100.00%</td>
<td valign="top" align="center">99.71%</td>
<td valign="top" align="center">99.40%</td>
<td valign="top" align="center">40.36%</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="center">chr19 23582963 23597406</td>
<td valign="top" align="center">38.86%</td>
<td valign="top" align="center">99.43%</td>
<td valign="top" align="center">99.40%</td>
<td valign="top" align="center">97.66%</td>
<td valign="top" align="center">98.15%</td>
<td valign="top" align="center">37.12%</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="center">chr17 28556159 28565079</td>
<td valign="top" align="center">66.11%</td>
<td valign="top" align="center">99.29%</td>
<td valign="top" align="center">98.71%</td>
<td valign="top" align="center">97.25%</td>
<td valign="top" align="center">90.89%</td>
<td valign="top" align="center">32.86%</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="center">chr1 156345936 156354251</td>
<td valign="top" align="center">50.08%</td>
<td valign="top" align="center">72.83%</td>
<td valign="top" align="center">65.77%</td>
<td valign="top" align="center">95.20%</td>
<td valign="top" align="center">99.57%</td>
<td valign="top" align="center">36.41%</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="center">chr9 31695596 31703805</td>
<td valign="top" align="center">80.81%</td>
<td valign="top" align="center">99.72%</td>
<td valign="top" align="center">99.70%</td>
<td valign="top" align="center">99.67%</td>
<td valign="top" align="center">67.48%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="center">chr5 52655093 52662923</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">92.79%</td>
<td valign="top" align="center">98.91%</td>
<td valign="top" align="center">99.45%</td>
<td valign="top" align="center">90.89%</td>
<td valign="top" align="center">30.65%</td>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td valign="top" align="center">chr19 25615095 25622844</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">93.22%</td>
<td valign="top" align="center">100.00%</td>
<td valign="top" align="center">97.07%</td>
<td valign="top" align="center">90.81%</td>
<td valign="top" align="center">28.99%</td>
</tr>
<tr>
<td valign="top" align="left">8</td>
<td valign="top" align="center">chr12 51714625 51722440</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">93.12%</td>
<td valign="top" align="center">99.80%</td>
<td valign="top" align="center">99.74%</td>
<td valign="top" align="center">91.07%</td>
<td valign="top" align="center">28.99%</td>
</tr>
<tr>
<td valign="top" align="left">9</td>
<td valign="top" align="center">chr6 73941843 73949302</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">85.44%</td>
<td valign="top" align="center">99.90%</td>
<td valign="top" align="center">99.60%</td>
<td valign="top" align="center">90.68%</td>
<td valign="top" align="center">15.01%</td>
</tr>
<tr>
<td valign="top" align="left">10</td>
<td valign="top" align="center">chr9 84591713 84599232</td>
<td valign="top" align="center">75.20%</td>
<td valign="top" align="center">99.67%</td>
<td valign="top" align="center">99.30%</td>
<td valign="top" align="center">30.92%</td>
<td valign="top" align="center">99.27%</td>
<td valign="top" align="center">36.97%</td>
</tr>
<tr>
<td valign="top" align="left">11</td>
<td valign="top" align="center">chr3 79615035 79622061</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">93.65%</td>
<td valign="top" align="center">98.31%</td>
<td valign="top" align="center">65.97%</td>
<td valign="top" align="center">90.42%</td>
<td valign="top" align="center">41.47%</td>
</tr>
<tr>
<td valign="top" align="left">12</td>
<td valign="top" align="center">chrX 56602551 56609242</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">91.80%</td>
<td valign="top" align="center">99.00%</td>
<td valign="top" align="center">99.16%</td>
<td valign="top" align="center">61.04%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="center">chr1 135696367 135712562</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">36.65%</td>
<td valign="top" align="center">96.02%</td>
<td valign="top" align="center">99.23%</td>
<td valign="top" align="center">89.52%</td>
<td valign="top" align="center">35.23%</td>
</tr>
<tr>
<td valign="top" align="left">14</td>
<td valign="top" align="center">chr11 63656712 63663509</td>
<td valign="top" align="center">75.91%</td>
<td valign="top" align="center">70.22%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">57.33%</td>
<td valign="top" align="center">99.31%</td>
<td valign="top" align="center">9.64%</td>
</tr>
<tr>
<td valign="top" align="left">15</td>
<td valign="top" align="center">chr2A 64123614 64129736</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">69.27%</td>
<td valign="top" align="center">77.51%</td>
<td valign="top" align="center">62.97%</td>
<td valign="top" align="center">90.51%</td>
<td valign="top" align="center">32.86%</td>
</tr>
<tr>
<td valign="top" align="left">16</td>
<td valign="top" align="center">chr3 128565266 128571536</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">93.84%</td>
<td valign="top" align="center">51.14%</td>
<td valign="top" align="center">57.99%</td>
<td valign="top" align="center">91.19%</td>
<td valign="top" align="center">30.65%</td>
</tr>
<tr>
<td valign="top" align="left">17</td>
<td valign="top" align="center">chr12 81696811 81702819</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">77.15%</td>
<td valign="top" align="center">56.02%</td>
<td valign="top" align="center">99.82%</td>
<td valign="top" align="center">54.90%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">18</td>
<td valign="top" align="center">chr11 49590235 49596119</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">49.88%</td>
<td valign="top" align="center">99.90%</td>
<td valign="top" align="center">99.56%</td>
<td valign="top" align="center">59.66%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">19</td>
<td valign="top" align="center">chr10 98677603 98683109</td>
<td valign="top" align="center">50.00%</td>
<td valign="top" align="center">99.62%</td>
<td valign="top" align="center">25.97%</td>
<td valign="top" align="center">10.07%</td>
<td valign="top" align="center">98.71%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">20</td>
<td valign="top" align="center">chr1 108430301 108435591</td>
<td valign="top" align="center">76.54%</td>
<td valign="top" align="center">99.29%</td>
<td valign="top" align="center">98.81%</td>
<td valign="top" align="center">17.11%</td>
<td valign="top" align="center">39.65%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">21</td>
<td valign="top" align="center">chrY 23381750 23386956</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">86.58%</td>
<td valign="top" align="center">78.61%</td>
<td valign="top" align="center">24.21%</td>
<td valign="top" align="center">95.83%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">22</td>
<td valign="top" align="center">chr11 50352478 50357771</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">14.93%</td>
<td valign="top" align="center">99.34%</td>
<td valign="top" align="center">90.64%</td>
<td valign="top" align="center">38.47%</td>
</tr>
<tr>
<td valign="top" align="left">23</td>
<td valign="top" align="center">chr11 49637737 49642530</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">51.07%</td>
<td valign="top" align="center">99.80%</td>
<td valign="top" align="center">41.17%</td>
<td valign="top" align="center">65.42%</td>
<td valign="top" align="center">22.20%</td>
</tr>
<tr>
<td valign="top" align="left">24</td>
<td valign="top" align="center">chr4 137449286 137454131</td>
<td valign="top" align="center">33.49%</td>
<td valign="top" align="center">75.30%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">14.91%</td>
<td valign="top" align="center">88.53%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">25</td>
<td valign="top" align="center">chr12 102968149 102972730</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">78.46%</td>
<td valign="top" align="center">91.15%</td>
<td valign="top" align="center">35.70%</td>
</tr>
<tr>
<td valign="top" align="left">26</td>
<td valign="top" align="center">chr3 109740319 109744759</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.52%</td>
<td valign="top" align="center">82.19%</td>
<td valign="top" align="center">36.52%</td>
<td valign="top" align="center">99.70%</td>
<td valign="top" align="center">37.20%</td>
</tr>
<tr>
<td valign="top" align="left">27</td>
<td valign="top" align="center">chr11 14869711 14874159</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">33.33%</td>
<td valign="top" align="center">63.85%</td>
<td valign="top" align="center">91.07%</td>
<td valign="top" align="center">33.10%</td>
</tr>
<tr>
<td valign="top" align="left">28</td>
<td valign="top" align="center">chr4 64843173 64847502</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">70.18%</td>
<td valign="top" align="center">99.61%</td>
<td valign="top" align="center">18.01%</td>
</tr>
<tr>
<td valign="top" align="left">29</td>
<td valign="top" align="center">chrX 34789238 34793597</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">16.02%</td>
<td valign="top" align="center">64.10%</td>
<td valign="top" align="center">90.85%</td>
<td valign="top" align="center">40.28%</td>
</tr>
<tr>
<td valign="top" align="left">30</td>
<td valign="top" align="center">chr8 44511870 44516437</td>
<td valign="top" align="center">14.14%</td>
<td valign="top" align="center">90.04%</td>
<td valign="top" align="center">99.60%</td>
<td valign="top" align="center">48.39%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">31</td>
<td valign="top" align="center">chr6 155777868 155781847</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">92.89%</td>
<td valign="top" align="center">67.65%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">32</td>
<td valign="top" align="center">chr19 24073629 24078094</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">82.12%</td>
<td valign="top" align="center">99.80%</td>
<td valign="top" align="center">56.92%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">33</td>
<td valign="top" align="center">chr4 77803811 77807756</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">55.72%</td>
<td valign="top" align="center">41.87%</td>
<td valign="top" align="center">90.46%</td>
<td valign="top" align="center">24.41%</td>
</tr>
<tr>
<td valign="top" align="left">34</td>
<td valign="top" align="center">chr8 12333790 12337817</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">61.68%</td>
<td valign="top" align="center">90.59%</td>
<td valign="top" align="center">28.83%</td>
</tr>
<tr>
<td valign="top" align="left">35</td>
<td valign="top" align="center">chr7 6075204 6079128</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">59.12%</td>
<td valign="top" align="center">90.94%</td>
<td valign="top" align="center">26.15%</td>
</tr>
<tr>
<td valign="top" align="left">36</td>
<td valign="top" align="center">chr8 43749874 43753733</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">34.03%</td>
<td valign="top" align="center">41.47%</td>
<td valign="top" align="center">90.34%</td>
<td valign="top" align="center">35.55%</td>
</tr>
<tr>
<td valign="top" align="left">37</td>
<td valign="top" align="center">chrY 6360429 6370254</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">34.03%</td>
<td valign="top" align="center">41.98%</td>
<td valign="top" align="center">89.99%</td>
<td valign="top" align="center">28.99%</td>
</tr>
<tr>
<td valign="top" align="left">38</td>
<td valign="top" align="center">chr8 86619640 86623356</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">3.28%</td>
<td valign="top" align="center">62.45%</td>
<td valign="top" align="center">70.75%</td>
<td valign="top" align="center">35.70%</td>
</tr>
<tr>
<td valign="top" align="left">39</td>
<td valign="top" align="center">chr20 29240803 29250628</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">34.03%</td>
<td valign="top" align="center">41.98%</td>
<td valign="top" align="center">89.99%</td>
<td valign="top" align="center">28.99%</td>
</tr>
<tr>
<td valign="top" align="left">40</td>
<td valign="top" align="center">chr4 77195305 77198763</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">45.75%</td>
<td valign="top" align="center">99.01%</td>
<td valign="top" align="center">3.40%</td>
</tr>
<tr>
<td valign="top" align="left">41</td>
<td valign="top" align="center">chr2A 102337670 102341003</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">37.29%</td>
<td valign="top" align="center">90.59%</td>
<td valign="top" align="center">27.33%</td>
</tr>
<tr>
<td valign="top" align="left">42</td>
<td valign="top" align="center">chr5 150548523 150551566</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">19.20%</td>
<td valign="top" align="center">63.77%</td>
<td valign="top" align="center">55.67%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">43</td>
<td valign="top" align="center">chr7 50863865 50867270</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">7.06%</td>
<td valign="top" align="center">64.03%</td>
<td valign="top" align="center">55.93%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">44</td>
<td valign="top" align="center">chr1 45743923 45746943</td>
<td valign="top" align="center">45.26%</td>
<td valign="top" align="center">99.43%</td>
<td valign="top" align="center">37.61%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">45</td>
<td valign="top" align="center">chrX 41627863 41630750</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">17.62%</td>
<td valign="top" align="center">90.72%</td>
<td valign="top" align="center">33.81%</td>
</tr>
<tr>
<td valign="top" align="left">46</td>
<td valign="top" align="center">chrX 42154219 42156882</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">6.96%</td>
<td valign="top" align="center">90.46%</td>
<td valign="top" align="center">38.63%</td>
</tr>
<tr>
<td valign="top" align="left">47</td>
<td valign="top" align="center">chr22 1446161 1448721</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">86.39%</td>
<td valign="top" align="center">88.06%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">48</td>
<td valign="top" align="center">chr16 44723847 44726410</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">5.13%</td>
<td valign="top" align="center">90.21%</td>
<td valign="top" align="center">35.86%</td>
</tr>
<tr>
<td valign="top" align="left">49</td>
<td valign="top" align="center">chrY 3095532 3098114</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">6.59%</td>
<td valign="top" align="center">90.89%</td>
<td valign="top" align="center">33.18%</td>
</tr>
<tr>
<td valign="top" align="left">50</td>
<td valign="top" align="center">chrY 13438427 13440964</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">6.92%</td>
<td valign="top" align="center">90.51%</td>
<td valign="top" align="center">29.62%</td>
</tr>
<tr>
<td valign="top" align="left">51</td>
<td valign="top" align="center">chr19 20847619 20850034</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">37.55%</td>
<td valign="top" align="center">99.90%</td>
<td valign="top" align="center">31.21%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">52</td>
<td valign="top" align="center">chr8 11324731 11327317</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">8.86%</td>
<td valign="top" align="center">91.02%</td>
<td valign="top" align="center">28.75%</td>
</tr>
<tr>
<td valign="top" align="left">53</td>
<td valign="top" align="center">chr1 31825639 31827932</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">34.03%</td>
<td valign="top" align="center">42.01%</td>
<td valign="top" align="center">42.53%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">54</td>
<td valign="top" align="center">chr2B 5807936 5810201</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">77.15%</td>
<td valign="top" align="center">36.89%</td>
</tr>
<tr>
<td valign="top" align="left">55</td>
<td valign="top" align="center">chr4 49398166 49400489</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">80.37%</td>
<td valign="top" align="center">35.15%</td>
</tr>
<tr>
<td valign="top" align="left">56</td>
<td valign="top" align="center">chr15 19096168 19099630</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">2.67%</td>
<td valign="top" align="center">82.04%</td>
<td valign="top" align="center">32.62%</td>
</tr>
<tr>
<td valign="top" align="left">57</td>
<td valign="top" align="center">chr4 162706670 162708848</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">77.32%</td>
<td valign="top" align="center">29.70%</td>
</tr>
<tr>
<td valign="top" align="left">58</td>
<td valign="top" align="center">chr2B 100074966 100077139</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">87.84%</td>
<td valign="top" align="center">9.95%</td>
</tr>
<tr>
<td valign="top" align="left">59</td>
<td valign="top" align="center">chr18 44459897 44461968</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">84.75%</td>
<td valign="top" align="center">6.32%</td>
</tr>
<tr>
<td valign="top" align="left">60</td>
<td valign="top" align="center">chr19 25500990 25503068</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">84.87%</td>
<td valign="top" align="center">47.56%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">61</td>
<td valign="top" align="center">chr14 71784651 71786596</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">61.25%</td>
<td valign="top" align="center">40.84%</td>
</tr>
<tr>
<td valign="top" align="left">62</td>
<td valign="top" align="center">chr4 55246241 55248103</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">33.93%</td>
<td valign="top" align="center">57.33%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">63</td>
<td valign="top" align="center">chr6 58293089 58294835</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">5.22%</td>
<td valign="top" align="center">91.84%</td>
<td valign="top" align="center">31.61%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">64</td>
<td valign="top" align="center">chr13 59301174 59302916</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">53.91%</td>
<td valign="top" align="center">37.28%</td>
</tr>
<tr>
<td valign="top" align="left">65</td>
<td valign="top" align="center">chr11 49783110 49784802</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">61.94%</td>
<td valign="top" align="center">0.09%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">66</td>
<td valign="top" align="center">chr2A 77283713 77285331</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">76.72%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">67</td>
<td valign="top" align="center">chr2B 97034956 97036587</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">54.17%</td>
<td valign="top" align="center">28.83%</td>
</tr>
<tr>
<td valign="top" align="left">68</td>
<td valign="top" align="center">chr5_NW_019932883v1_random 1485086 1486708</td>
<td valign="top" align="center">48.97%</td>
<td valign="top" align="center">39.26%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">69</td>
<td valign="top" align="center">chr4 50892584 50893971</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">54.25%</td>
<td valign="top" align="center">9.56%</td>
</tr>
<tr>
<td valign="top" align="left">70</td>
<td valign="top" align="center">chrY 14091617 14092838</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">41.92%</td>
<td valign="top" align="center">19.04%</td>
</tr>
<tr>
<td valign="top" align="left">71</td>
<td valign="top" align="center">chrY 5451943 5453164</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">41.92%</td>
<td valign="top" align="center">19.04%</td>
</tr>
<tr>
<td valign="top" align="left">72</td>
<td valign="top" align="center">chrX 46463406 46464551</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">34.03%</td>
<td valign="top" align="center">30.99%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
</tr>
<tr>
<td valign="top" align="left">73</td>
<td valign="top" align="center">chrY 1087726 1088806</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">41.92%</td>
<td valign="top" align="center">8.06%</td>
</tr>
<tr>
<td valign="top" align="left">74</td>
<td valign="top" align="center">chr5 32949251 32950412</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">30.03%</td>
<td valign="top" align="center">35.70%</td>
</tr>
<tr>
<td valign="top" align="left">75</td>
<td valign="top" align="center">chr10 77164804 77165954</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">26.63%</td>
<td valign="top" align="center">39.89%</td>
</tr>
<tr>
<td valign="top" align="left">76</td>
<td valign="top" align="center">chr1 104828192 104829066</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">0.00%</td>
<td valign="top" align="center">25.68%</td>
<td valign="top" align="center">13.57%</td>
<td valign="top" align="center">0.00%</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Phylogenetic analyses</title>
<p>To further confirm the assignment of identified HML-8 elements in the chimpanzee genome and characterize their phylogenetic relationships, an ML phylogenetic tree for near-full-length proviruses was first constructed. Three proviral sequences (longer than 80% of the HML-8 reference length) were screened to generate their phylogenetic relationships (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>). Next, 4 ML trees were constructed for subregions whose lengths were longer than 90% of the corresponding section of the reference sequence; these included 15 <italic>gag</italic> elements, 19 <italic>pro</italic> elements, 15 <italic>pol</italic> elements, and 33 <italic>env</italic> elements (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4B&#x2013;E</bold>
</xref>). For comparison, the Dfam HERV-K group (HML-1&#x2013;10) and 3 exogenous betaretroviruses were used as representatives and outgroups, respectively. These phylogenetic groups of different regions of HML-8 were all distinctly separated from the other HERV-K groups (HML-1&#x2013;7 and HML-9&#x2013;10) (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4A&#x2013;E</bold>
</xref>). The 3 screened proviruses all clustered with the Dfam HML-8 reference with bootstrap support of 100%, indicating that they are significantly more likely to be HML-8 than any other HML subtype (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>). The phylogenetic groups for different regions of HML-8 all clustered together with their corresponding sections of the HML-8 reference, respectively (bootstrap support of 100% for <italic>gag</italic>, <italic>pol</italic>, and <italic>pro</italic>, 92.2% for <italic>env</italic>). Interestingly, two distinct clusters in the <italic>gag</italic> group were identified. The two clusters were statistically supported by bootstrap values of &#x2265;95% and were named HML-8 type a and type b. The results showed that chr8 44511870 44516437, chr3 79615035 79622061, chr17 28556159 28565079, chrX 56602551 56609242, chr12 51714625 51722440, chr19 25615095 25622844, chr3 128565266 128571536, and chr5 52655093 52662923 were included in type a, whereas chr1 45743923 45746943, chr10 98677603 98683109, chr19 23582963 23597406, chr1 108430301 108435591, chr9 31695596 31703805, chr9 84591713 84599232, and chr11 97063674 97072831 were included in type b. HML-8 type b sequences included the Dfam HML-8 reference, whereas HML-8 type a elements showed more divergence relative to the HML-8 reference. There are no solo LTRs in the chimpanzee genome. Thus, no phylogenetic trees for solo LTRs have been constructed.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Phylogenetic analysis of the HML-8 near-full-length proviruses and 4 subregions by the maximum likelihood method. Phylogenetic analyses of 3 HML-8 proviral elements <bold>(A)</bold>, 15 <italic>gag</italic> elements <bold>(B)</bold>, 19 <italic>pro</italic> elements <bold>(C)</bold>, 15 <italic>pol</italic> elements <bold>(D)</bold>, and 33 <italic>env</italic> elements <bold>(E)</bold>, along with reference sequences. The generated phylogenetic trees were all tested by the bootstrap method with 500 replicates. The branch length indicates the number of substitutions per site. The two intragroup clusters of the <italic>gag</italic> genes (types a and b) were annotated and depicted with different colors, respectively.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-14-1349046-g004.tif"/>
</fig>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Estimated time of integration</title>
<p>Like the distribution dynamics and other characteristics of these remnants, the integration time of each chimpanzee HML-8 member is also a key clue to understanding the evolution of the group across primates. Given the serious lack of intact LTRs of the proviruses, i.e., no provirus has a 5&#x2019; LTR or 3&#x2019; LTR greater than 70%, the proviral LTRs were not used for the integration time calculation as previously described (<xref ref-type="bibr" rid="B19">Jia et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B28">Liu et&#xa0;al., 2023</xref>). Here, we estimated the age of the 46 HML-8 proviral elements in the chimpanzee genome based on the available <italic>gag</italic>, <italic>pro</italic>, <italic>pol</italic>, and <italic>env</italic> regions, respectively (<xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>). Each region whose length exceeded 90% of the corresponding reference sequence was used to calculate the integration time. The integration time (T, in million years) was estimated with the formula T = D/0.2, where D is the percentage of divergent nucleotides and 0.2 represents the host genome neutral mutation rate expressed as the percentage of substitutions/nucleotide/million years. For each proviral region mentioned above, an ancestral sequence was generated via MEGA7 using the ML method, based on a multiple alignment of all the elements. The details of the proviral formation periods are shown in <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>. Overall, the HML-8 elements (<italic>gag</italic>, <italic>pro</italic>, <italic>pol</italic>, and <italic>env</italic>) found in the chimpanzee genome were integrated between 15 and 52.33 million years ago (mya). The average integration time was 35.86 mya, and the median was 37.25 mya. In our previous study, we performed a comprehensive identification and characterization of the HML-8 group in the human genome (<xref ref-type="bibr" rid="B28">Liu et&#xa0;al., 2023</xref>). Through comparison, it was found that the integration of human HML-8 elements mainly occurred between 23.5 and 52 mya. The average integration time was 37.11 mya, and the median was 37.42 mya. The divergence between human and chimpanzee ancestors is known to trace back to approximately 6.5&#x2013;7.5 mya or earlier. The results indicated that the chimpanzee-specific insertion periods were indeed similar to the human-specific insertion periods and further confirmed that HML-8 was integrated into common ancestors before humans and chimpanzees diverged.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Estimated integration time of HML-8 elements.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" align="center">Number</th>
<th valign="middle" rowspan="2" align="center">Provirus regions</th>
<th valign="top" colspan="4" align="center">Divergence from Consensus sequence</th>
<th valign="middle" rowspan="2" align="center">Mean Divergences</th>
<th valign="middle" rowspan="2" align="center">T&#x2009;=&#x2009;D/0.2</th>
<th valign="middle" rowspan="2" align="center">Age/ million years (gene vs consensus)</th>
</tr>
<tr>
<th valign="middle" align="center">gag</th>
<th valign="middle" align="center">pro</th>
<th valign="middle" align="center">pol</th>
<th valign="middle" align="center">env</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">1</td>
<td valign="top" align="center">chr11 97063674 97072831</td>
<td valign="top" align="center">0.113</td>
<td valign="top" align="center">0.087</td>
<td valign="top" align="center">0.086</td>
<td valign="top" align="center">0.076</td>
<td valign="top" align="center">0.091</td>
<td valign="top" align="center">0.4525</td>
<td valign="top" align="center">45.25</td>
</tr>
<tr>
<td valign="top" align="center">2</td>
<td valign="top" align="center">chr19 23582963 23597406</td>
<td valign="top" align="center">0.109</td>
<td valign="top" align="center">0.075</td>
<td valign="top" align="center">0.096</td>
<td valign="top" align="center">0.087</td>
<td valign="top" align="center">0.092</td>
<td valign="top" align="center">0.45875</td>
<td valign="top" align="center">45.875</td>
</tr>
<tr>
<td valign="top" align="center">3</td>
<td valign="top" align="center">chr17 28556159 28565079</td>
<td valign="top" align="center">0.064</td>
<td valign="top" align="center">0.062</td>
<td valign="top" align="center">0.077</td>
<td valign="top" align="center">0.054</td>
<td valign="top" align="center">0.064</td>
<td valign="top" align="center">0.32125</td>
<td valign="top" align="center">32.125</td>
</tr>
<tr>
<td valign="top" align="center">4</td>
<td valign="top" align="center">chr1 156345936 156354251</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.092</td>
<td valign="top" align="center">0.070</td>
<td valign="top" align="center">0.081</td>
<td valign="top" align="center">0.405</td>
<td valign="top" align="center">40.5</td>
</tr>
<tr>
<td valign="top" align="center">5</td>
<td valign="top" align="center">chr9 31695596 31703805</td>
<td valign="top" align="center">0.124</td>
<td valign="top" align="center">0.089</td>
<td valign="top" align="center">0.101</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.105</td>
<td valign="top" align="center">0.523333333</td>
<td valign="top" align="center">52.33333333</td>
</tr>
<tr>
<td valign="top" align="center">6</td>
<td valign="top" align="center">chr5 52655093 52662923</td>
<td valign="top" align="center">0.100</td>
<td valign="top" align="center">0.050</td>
<td valign="top" align="center">0.029</td>
<td valign="top" align="center">0.054</td>
<td valign="top" align="center">0.058</td>
<td valign="top" align="center">0.29125</td>
<td valign="top" align="center">29.125</td>
</tr>
<tr>
<td valign="top" align="center">7</td>
<td valign="top" align="center">chr19 25615095 25622844</td>
<td valign="top" align="center">0.099</td>
<td valign="top" align="center">0.071</td>
<td valign="top" align="center">0.039</td>
<td valign="top" align="center">0.068</td>
<td valign="top" align="center">0.069</td>
<td valign="top" align="center">0.34625</td>
<td valign="top" align="center">34.625</td>
</tr>
<tr>
<td valign="top" align="center">8</td>
<td valign="top" align="center">chr12 51714625 51722440</td>
<td valign="top" align="center">0.129</td>
<td valign="top" align="center">0.080</td>
<td valign="top" align="center">0.052</td>
<td valign="top" align="center">0.063</td>
<td valign="top" align="center">0.081</td>
<td valign="top" align="center">0.405</td>
<td valign="top" align="center">40.5</td>
</tr>
<tr>
<td valign="top" align="center">9</td>
<td valign="top" align="center">chr6 73941843 73949302</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.050</td>
<td valign="top" align="center">0.075</td>
<td valign="top" align="center">0.054</td>
<td valign="top" align="center">0.060</td>
<td valign="top" align="center">0.298333333</td>
<td valign="top" align="center">29.83333333</td>
</tr>
<tr>
<td valign="top" align="center">10</td>
<td valign="top" align="center">chr9 84591713 84599232</td>
<td valign="top" align="center">0.109</td>
<td valign="top" align="center">0.091</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.074</td>
<td valign="top" align="center">0.091</td>
<td valign="top" align="center">0.456666667</td>
<td valign="top" align="center">45.66666667</td>
</tr>
<tr>
<td valign="top" align="center">11</td>
<td valign="top" align="center">chr3 79615035 79622061</td>
<td valign="top" align="center">0.048</td>
<td valign="top" align="center">0.054</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.047</td>
<td valign="top" align="center">0.050</td>
<td valign="top" align="center">0.248333333</td>
<td valign="top" align="center">24.83333333</td>
</tr>
<tr>
<td valign="top" align="center">12</td>
<td valign="top" align="center">chrX 56602551 56609242</td>
<td valign="top" align="center">0.068</td>
<td valign="top" align="center">0.059</td>
<td valign="top" align="center">0.065</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.064</td>
<td valign="top" align="center">0.32</td>
<td valign="top" align="center">32</td>
</tr>
<tr>
<td valign="top" align="center">13</td>
<td valign="top" align="center">chr1 135696367 135712562</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.071</td>
<td valign="top" align="center">0.044</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.058</td>
<td valign="top" align="center">0.2875</td>
<td valign="top" align="center">28.75</td>
</tr>
<tr>
<td valign="top" align="center">14</td>
<td valign="top" align="center">chr11 63656712 63663509</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.075</td>
<td valign="top" align="center">0.075</td>
<td valign="top" align="center">0.375</td>
<td valign="top" align="center">37.5</td>
</tr>
<tr>
<td valign="top" align="center">15</td>
<td valign="top" align="center">chr2A 64123614 64129736</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.045</td>
<td valign="top" align="center">0.045</td>
<td valign="top" align="center">0.225</td>
<td valign="top" align="center">22.5</td>
</tr>
<tr>
<td valign="top" align="center">16</td>
<td valign="top" align="center">chr3 128565266 128571536</td>
<td valign="top" align="center">0.088</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.043</td>
<td valign="top" align="center">0.066</td>
<td valign="top" align="center">0.3275</td>
<td valign="top" align="center">32.75</td>
</tr>
<tr>
<td valign="top" align="center">17</td>
<td valign="top" align="center">chr12 81696811 81702819</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.041</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.041</td>
<td valign="top" align="center">0.205</td>
<td valign="top" align="center">20.5</td>
</tr>
<tr>
<td valign="top" align="center">18</td>
<td valign="top" align="center">chr11 49590235 49596119</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.082</td>
<td valign="top" align="center">0.085</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.084</td>
<td valign="top" align="center">0.4175</td>
<td valign="top" align="center">41.75</td>
</tr>
<tr>
<td valign="top" align="center">19</td>
<td valign="top" align="center">chr10 98677603 98683109</td>
<td valign="top" align="center">0.099</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.069</td>
<td valign="top" align="center">0.084</td>
<td valign="top" align="center">0.42</td>
<td valign="top" align="center">42</td>
</tr>
<tr>
<td valign="top" align="center">20</td>
<td valign="top" align="center">chr1 108430301 108435591</td>
<td valign="top" align="center">0.107</td>
<td valign="top" align="center">0.078</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.093</td>
<td valign="top" align="center">0.4625</td>
<td valign="top" align="center">46.25</td>
</tr>
<tr>
<td valign="top" align="center">21</td>
<td valign="top" align="center">chrY 23381750 23386956</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.098</td>
<td valign="top" align="center">0.098</td>
<td valign="top" align="center">0.49</td>
<td valign="top" align="center">49</td>
</tr>
<tr>
<td valign="top" align="center">22</td>
<td valign="top" align="center">chr11 50352478 50357771</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.078</td>
<td valign="top" align="center">0.065</td>
<td valign="top" align="center">0.072</td>
<td valign="top" align="center">0.3575</td>
<td valign="top" align="center">35.75</td>
</tr>
<tr>
<td valign="top" align="center">23</td>
<td valign="top" align="center">chr11 49637737 49642530</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.085</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.085</td>
<td valign="top" align="center">0.425</td>
<td valign="top" align="center">42.5</td>
</tr>
<tr>
<td valign="top" align="center">25</td>
<td valign="top" align="center">chr12 102968149 102972730</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.031</td>
<td valign="top" align="center">0.031</td>
<td valign="top" align="center">0.155</td>
<td valign="top" align="center">15.5</td>
</tr>
<tr>
<td valign="top" align="center">26</td>
<td valign="top" align="center">chr3 109740319 109744759</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.078</td>
<td valign="top" align="center">0.078</td>
<td valign="top" align="center">0.39</td>
<td valign="top" align="center">39</td>
</tr>
<tr>
<td valign="top" align="center">27</td>
<td valign="top" align="center">chr11 14869711 14874159</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.049</td>
<td valign="top" align="center">0.049</td>
<td valign="top" align="center">0.245</td>
<td valign="top" align="center">24.5</td>
</tr>
<tr>
<td valign="top" align="center">28</td>
<td valign="top" align="center">chr4 64843173 64847502</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.062</td>
<td valign="top" align="center">0.062</td>
<td valign="top" align="center">0.31</td>
<td valign="top" align="center">31</td>
</tr>
<tr>
<td valign="top" align="center">29</td>
<td valign="top" align="center">chrX 34789238 34793597</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.040</td>
<td valign="top" align="center">0.040</td>
<td valign="top" align="center">0.2</td>
<td valign="top" align="center">20</td>
</tr>
<tr>
<td valign="top" align="center">30</td>
<td valign="top" align="center">chr8 44511870 44516437</td>
<td valign="top" align="center">0.105</td>
<td valign="top" align="center">0.075</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.090</td>
<td valign="top" align="center">0.45</td>
<td valign="top" align="center">45</td>
</tr>
<tr>
<td valign="top" align="center">31</td>
<td valign="top" align="center">chr6 155777868 155781847</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.093</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.093</td>
<td valign="top" align="center">0.465</td>
<td valign="top" align="center">46.5</td>
</tr>
<tr>
<td valign="top" align="center">32</td>
<td valign="top" align="center">chr19 24073629 24078094</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.076</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.076</td>
<td valign="top" align="center">0.38</td>
<td valign="top" align="center">38</td>
</tr>
<tr>
<td valign="top" align="center">33</td>
<td valign="top" align="center">chr4 77803811 77807756</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.075</td>
<td valign="top" align="center">0.075</td>
<td valign="top" align="center">0.375</td>
<td valign="top" align="center">37.5</td>
</tr>
<tr>
<td valign="top" align="center">34</td>
<td valign="top" align="center">chr8 12333790 12337817</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.065</td>
<td valign="top" align="center">0.065</td>
<td valign="top" align="center">0.325</td>
<td valign="top" align="center">32.5</td>
</tr>
<tr>
<td valign="top" align="center">35</td>
<td valign="top" align="center">chr7 6075204 6079128</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.066</td>
<td valign="top" align="center">0.066</td>
<td valign="top" align="center">0.33</td>
<td valign="top" align="center">33</td>
</tr>
<tr>
<td valign="top" align="center">36</td>
<td valign="top" align="center">chr8 43749874 43753733</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.087</td>
<td valign="top" align="center">0.087</td>
<td valign="top" align="center">0.435</td>
<td valign="top" align="center">43.5</td>
</tr>
<tr>
<td valign="top" align="center">40</td>
<td valign="top" align="center">chr4 77195305 77198763</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.084</td>
<td valign="top" align="center">0.084</td>
<td valign="top" align="center">0.42</td>
<td valign="top" align="center">42</td>
</tr>
<tr>
<td valign="top" align="center">41</td>
<td valign="top" align="center">chr2A 102337670 102341003</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.030</td>
<td valign="top" align="center">0.030</td>
<td valign="top" align="center">0.15</td>
<td valign="top" align="center">15</td>
</tr>
<tr>
<td valign="top" align="center">44</td>
<td valign="top" align="center">chr1 45743923 45746943</td>
<td valign="top" align="center">0.083</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.083</td>
<td valign="top" align="center">0.415</td>
<td valign="top" align="center">41.5</td>
</tr>
<tr>
<td valign="top" align="center">45</td>
<td valign="top" align="center">chrX 41627863 41630750</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.074</td>
<td valign="top" align="center">0.074</td>
<td valign="top" align="center">0.37</td>
<td valign="top" align="center">37</td>
</tr>
<tr>
<td valign="top" align="center">46</td>
<td valign="top" align="center">chrX 42154219 42156882</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.046</td>
<td valign="top" align="center">0.046</td>
<td valign="top" align="center">0.23</td>
<td valign="top" align="center">23</td>
</tr>
<tr>
<td valign="top" align="center">48</td>
<td valign="top" align="center">chr16 44723847 44726410</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.054</td>
<td valign="top" align="center">0.054</td>
<td valign="top" align="center">0.27</td>
<td valign="top" align="center">27</td>
</tr>
<tr>
<td valign="top" align="center">49</td>
<td valign="top" align="center">chrY 3095532 3098114</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.090</td>
<td valign="top" align="center">0.090</td>
<td valign="top" align="center">0.45</td>
<td valign="top" align="center">45</td>
</tr>
<tr>
<td valign="top" align="center">50</td>
<td valign="top" align="center">chrY 13438427 13440964</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.095</td>
<td valign="top" align="center">0.095</td>
<td valign="top" align="center">0.475</td>
<td valign="top" align="center">47.5</td>
</tr>
<tr>
<td valign="top" align="center">51</td>
<td valign="top" align="center">chr19 20847619 20850034</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.091</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.091</td>
<td valign="top" align="center">0.455</td>
<td valign="top" align="center">45.5</td>
</tr>
<tr>
<td valign="top" align="center">52</td>
<td valign="top" align="center">chr8 11324731 11327317</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.068</td>
<td valign="top" align="center">0.068</td>
<td valign="top" align="center">0.34</td>
<td valign="top" align="center">34</td>
</tr>
<tr>
<td valign="top" align="center">63</td>
<td valign="top" align="center">chr6 58293089 58294835</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.068</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">NA</td>
<td valign="top" align="center">0.068</td>
<td valign="top" align="center">0.34</td>
<td valign="top" align="center">34</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>&#x201c;NA&#x201d; stands for Not Applicable.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Despite all this, there are significant differences in distribution quantity and structural form. The chimpanzee genome included 76 HML-8 proviral elements and 0 solo LTRs. By comparison, there are only 40 proviruses in the human genome, almost half as many as in the chimpanzee genome. In addition, the human genome also contains 5 solo LTRs. Solo LTRs arise from recombination between LTRs and the removal of intermediate regions of a provirus, and these recombination events mainly occur during meiotic recombination (<xref ref-type="bibr" rid="B17">Jia and Li, 2018</xref>). This significant difference precisely indicated that even after integration, the interaction between the pathogen and its host did not stop. The host genome can retain helpful or select against harmful proviral integrations. The chimpanzee genome contains more HML-8 proviral elements (76 vs. 40) and fewer solo LTRs (0 vs. 5) than humans. Since HML-8 integration occurred more than 30 million years prior to the divergence of chimpanzees and humans, the different distribution and number of these elements are likely due to differences in selection on these proviruses in the different species. This suggests that HML-8 integrations were retained at a greater rate in the chimpanzee genome than in the human genome, perhaps due to selection pressure differences or different rates of recombination during meiosis. Our results may suggest the difference in genome response to proviral integration contributed to the speciation event, which created humans and chimpanzees as distinct species.</p>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Functional prediction of cis-regulatory regions and enrichment analysis</title>
<p>The LTR plays a crucial role in virus transcription and replication. Although most HML-8 LTRs are severely truncated, any regulatory sites present in the remaining sequence can play a role in the host genome&#x2019;s functional process as cis-regulatory regions. The Genomic Regions Enrichment of Annotations Tool (GREAT) can predict the biological significance of these noncoding regions by analyzing annotations of nearby genes, i.e., based on spatial proximity. For the chimpanzee-specific HML-8 proviral LTRs, we selected LTR sequences larger than 70% of the reference sequence for further prediction. The results describing the associations between each proviral LTR and its putative-regulated gene(s) are shown in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>. Seven genes were predicted in total. Among them, 1 LTR was associated with 1 gene, and 3 LTRs were associated with 2 genes (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM2">
<bold>Supplementary Table S1</bold>
</xref>). No gene had an absolute distance from the transcription start site (TSS) of less than 5 kb. The absolute distance measures how far the proviral LTR is from the TSS of its associated gene. For 4 genes, the absolute distance to the TSS was 5 to 50 kb; for 2 genes, it was between 50 and 500 kb; and for 1 gene, it was greater than 500 kb (<xref ref-type="fig" rid="f5">
<bold>Figures&#xa0;5B, C</bold>
</xref>). To analyze the biological taxonomy of genes associated with LTRs, we produced GO Slim summaries to annotate these genes to functional categories. GO biological process (BP) analysis revealed that these genes were involved mainly in metabolic processes, responses to stimulus, localization, and biological regulation (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5D</bold>
</xref>). The GO Slim cellular component (CC) summary showed that these genes were significantly involved in the cytosol, mitochondrion, and endoplasmic reticulum, and the GO Slim molecular function (MF) summary revealed that these genes were significantly involved in protein binding, ion binding, and transferase activity (<xref ref-type="fig" rid="f5">
<bold>Figures&#xa0;5E, F</bold>
</xref>).</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>The genes associated with proviral LTRs and GO Slim summaries. <bold>(A)</bold> The number of associated genes per proviral LTR. <bold>(B)</bold> Binned by orientation and distance to the TSS. <bold>(C)</bold> Binned by the absolute distance to the TSS. The biological process <bold>(D)</bold>, cellular component <bold>(E)</bold>, and molecular function <bold>(F)</bold> categories are represented by red, blue, and green bars, respectively. The height of the bar represents the number of IDs in the gene list and in the category.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-14-1349046-g005.tif"/>
</fig>
<p>Moreover, these potential regulatory genes were subjected to enrichment analysis using WebGestalt. The top 10 most significant GO terms according to the FDR value for BPs included &#x201c;response to iron(II) ion&#x201d;, &#x201c;detoxification of nitrogen compound&#x201d;, &#x201c;toll-like receptor 7 signaling pathway&#x201d;, &#x201c;glutathione derivative metabolic process&#x201d;, &#x201c;glutathione metabolic process&#x201d;, &#x201c;sulfur compound biosynthetic process&#x201d;, &#x201c;cellular modified amino acid metabolic process&#x201d;, &#x201c;peptide metabolic process&#x201d;, and &#x201c;cellular amide metabolic process&#x201d; (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6A</bold>
</xref>).</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Enrichment result categories binned by biological process, cellular component, and molecular function. <bold>(A, B)</bold> Bar chart and customizable volcano plot of the biological process enrichment results. A bar graph showing the enrichment ratio of the results was constructed. Bars representing categories with an FDR&#x2009;&#x2264;&#x2009;0.05 are shown in a darker shade <bold>(A)</bold>. The volcano plot in <bold>(B)</bold> shows the log2 of the FDR versus the enrichment ratio for all the functional categories in the database, highlighting the degree to which the significant categories are separated from the background. The size and color of a dot are proportional to the number of overlaps (for ORA). The significantly enriched categories are labeled, and the labels are positioned automatically by a force field-based algorithm at startup. <bold>(C, D)</bold> Bar chart and customizable volcano plot of the cellular component enrichment results. <bold>(E, F)</bold> Bar chart and customizable volcano plot of the molecular function enrichment results.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-14-1349046-g006.tif"/>
</fig>
<p>The enrichment results for the CC and MF categories are shown in <xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6C&#x2013;F</bold>
</xref>. As repeatedly emphasized in our previous papers, all these results are entirely prediction-based, and future biological research is needed to confirm any of the implied associations between proviral LTRs and nearby genes.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>ERV is an indispensable partner in the evolutionary process of primates. The integration and coevolution of ERVs can shape the host genome and participate in physiological and pathological processes (<xref ref-type="bibr" rid="B20">Johnson, 2019</xref>; <xref ref-type="bibr" rid="B16">Jansz and Faulkner, 2021</xref>; <xref ref-type="bibr" rid="B7">Chen et&#xa0;al., 2022</xref>). Therefore, it is critical to study the distribution of HML-8 loci in the chimpanzee genome to understand their evolutionary history and to inform future functional research. Previously, we conducted a comprehensive identification and characterization of the HML-8 group in the human genome (<xref ref-type="bibr" rid="B28">Liu et&#xa0;al., 2023</xref>). However, there is still a lack of comprehensive understanding of the evolutionary history of ERVs in other primates, such as chimpanzees, which are the closest living genetic relatives of humans and share much of our genetic information, including ERVs integrated in the genome. The distribution and function prediction of HML-8 in chimpanzees remain unclear and thus the comparisons of these elements between the two hosts cannot be carried out. We further characterized these remnants in chimpanzees and provided a detailed description of the HML-8 proviruses in the chimpanzee genome, including the HML-8 genome distribution, structural characteristics, phylogeny, integration time analysis, and regulatory function prediction.</p>
<p>We identified a total of 76 HML-8 proviral elements, and the results showed that the distribution of these proviral elements in the chimpanzee genome was nonrandom. Our previous studies have shown that the distribution of HML-8 loci in humans is not random (p&lt;0.005). Our comparison between HML-8 elements in the human and chimpanzee genomes showed that there is great similarity in the distribution of proviral chromosomal positions between chimpanzees and humans. Both genomes showed significant enrichment of proviral integration in chromosomes 11, 19, and Y compared to the predicted number.</p>
<p>Like in humans, the number of proviral elements integrated into the Y chromosome of chimpanzees was significantly greater than that predicted (p&lt;0.05). The Y chromosome is one of the two sex chromosomes that determines male sex. It is not only structurally complex but also the fastest-changing chromosome among human chromosomes. In addition to features related to sex determination, genes on the Y chromosome also have an impact on other traits and diseases in humans, such as the risk and severity of cancer (<xref ref-type="bibr" rid="B34">Rhie et&#xa0;al., 2023</xref>). There are several possible reasons for the insertions into the Y chromosome. The first possibility is that the low gene density on the Y chromosome allowed additional provirus insertions to become fixed in the population owing to a decreased chance of gene disruption. An insertion on the Y chromosome may have a lower chance of being deleterious and, therefore, would be more likely to be retained and passed on to the next generation. In addition, the physical placement of the chromosome within the nucleus and the chromatin status also strongly influence whether a provirus can be inserted into that portion of the genome (<xref ref-type="bibr" rid="B34">Rhie et&#xa0;al., 2023</xref>). In any case, ERV enrichment on the Y chromosome could suggest that these elements may be deeply involved in reproduction, disease, and other unresolved processes.</p>
<p>Structural characterization revealed that no HML-8 members retained near full-length proviral structures. All the HML-8 elements have become fragmented due to insertion, deletion, or other mutations during the long history of evolution, including a total of 63 complete deletions of the 5&#x2019; LTR sequence and 25 complete deletions of the 3&#x2019; LTR of the proviruses. The middle four open reading frames (<italic>gag</italic>, <italic>pro</italic>, <italic>pol</italic>, and <italic>env</italic>) had 43, 34, 19, and 11 complete deletions, respectively. Such a large-scale deficiency reflects the host&#x2019;s ability to reshape foreign elements, screening out harmful elements and leaving behind useful elements. Subregion phylogenetic analysis of 4 internal regions revealed that 15 <italic>gag</italic> elements, 19 <italic>pro</italic> elements, 15 <italic>pol</italic> elements, and 33 <italic>env</italic> sequences formed a unique cluster, each of which was supported by strong bootstrap values, confirming their assignment with great certainty.</p>
<p>The integration time of most HML-8 elements (<italic>gag</italic>, <italic>pro</italic>, <italic>pol</italic>, and <italic>env</italic>) found in the chimpanzee genome is mainly between 15 and 52.33 mya, with an average integration time of 35.86 mya and a median of 37.25 mya, which are very similar to those of humans. These results further confirmed that HML-8 was integrated before the divergence between human and chimpanzee ancestors, which occurred approximately 6.5&#x2013;7.5 mya. The integration and coevolution of ERVs can reshape the host genome and participate in physiological and pathological processes (<xref ref-type="bibr" rid="B20">Johnson, 2019</xref>; <xref ref-type="bibr" rid="B16">Jansz and Faulkner, 2021</xref>; <xref ref-type="bibr" rid="B7">Chen et&#xa0;al., 2022</xref>). The significant differences in quantity and structure of HML-8 between humans and chimpanzees obtained from the present study indicated that, in turn, the host will also screen and reshape the external elements integrated from the outside. Even after proviral integration has completed, interactions between the host genome and the inserted provirus continue. Integrated exogenous retroviruses will undergo genetic recombination according to the evolutionary mechanisms of the host genome following meiotic recombination, site-specific recombination, and transpositional recombination (<xref ref-type="bibr" rid="B18">Jia et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B17">Jia and Li, 2018</xref>). A typical remnant of the original and complete provirus is the solo LTR, which arises from host homologous recombination between ancestral 5&#x2019; and 3&#x2019; proviral LTRs, where the intervening protein-coding sequence is deleted (<xref ref-type="bibr" rid="B30">Mager and Goodchild, 1989</xref>; <xref ref-type="bibr" rid="B15">Hughes and Coffin, 2004</xref>; <xref ref-type="bibr" rid="B17">Jia and Li, 2018</xref>; <xref ref-type="bibr" rid="B39">Thomas et&#xa0;al., 2018</xref>). 
It was reported that at least 85% of reference genome ERV instances are solo LTRs (<xref ref-type="bibr" rid="B25">Lander et&#xa0;al., 2001</xref>; <xref ref-type="bibr" rid="B31">Mager and Stoye, 2015</xref>; <xref ref-type="bibr" rid="B39">Thomas et&#xa0;al., 2018</xref>). Compared to humans, chimpanzees maintain many more proviral elements and fewer solo LTRs, indicating that the active interaction between the chimpanzee genome and the integrated proviruses is lower than that of the human genome, which has a greater ability to shape integrated proviral elements.</p>
<p>In summary, we have described in detail the existence and distribution of HML-8 elements in the chimpanzee genome, as well as the structural characterization and phylogenetic analysis of these remnants. In addition, we further predicted the potential biological function of the genes related to proviral LTRs via bioinformatics methods. Our work revealed that the chimpanzee genome contains fewer chimpanzee-specific HML-8 solo LTR integrations but more chimpanzee-specific HML-8 provirus integrations, suggesting that HML-8 elements evolved in different ways after the divergence of human and chimpanzee ancestors. The results of the present study could provide a comprehensive research background for the differences between human and chimpanzee genomes and the potential implications in the future.</p>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>.</p>
</sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>CW: Writing &#x2013; original draft, Data curation, Formal analysis. XZ: Writing &#x2013; original draft, Formal analysis, Methodology. SW: Writing &#x2013; original draft, Data curation, Methodology. BZ: Software, Writing &#x2013; review &amp; editing. CY: Software, Writing &#x2013; review &amp; editing. YS: Validation, Writing &#x2013; review &amp; editing. HL: Writing &#x2013; review &amp; editing, Validation. YL: Writing &#x2013; review &amp; editing, Validation. JH: Writing &#x2013; review &amp; editing, Visualization. XW: Writing &#x2013; review &amp; editing, Visualization. JL: Writing &#x2013; review &amp; editing, Visualization. MC: Writing &#x2013; review &amp; editing, Data curation, Methodology. LJ: Writing &#x2013; review &amp; editing, Conceptualization, Data curation, Formal analysis, Methodology, Writing &#x2013; original draft. LL: Conceptualization, Writing &#x2013; review &amp; editing, Data curation, Formal analysis, Writing &#x2013; original draft.</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This study was supported by the State Key Laboratory of Pathogen and Biosecurity (SKLPBS2138).</p>
</sec>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fcimb.2024.1349046/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fcimb.2024.1349046/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.xlsx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="DataSheet_2.xlsx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bannert</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Kurth</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Retroelements and the human genome: new perspectives on an old relation</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>101 Suppl 2</volume>, <fpage>14572</fpage>&#x2013;<lpage>14579</lpage>.  doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0404838101</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bannert</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Kurth</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>The evolutionary dynamics of human endogenous retroviral families</article-title>. <source>Annu. Rev. Genomics Hum. Genet.</source> <volume>7</volume>, <fpage>149</fpage>&#x2013;<lpage>173</lpage>. doi: <pub-id pub-id-type="doi">10.1146/annurev.genom.7.080505.115700</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Barbulescu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Turner</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Seaman</surname> <given-names>M. I.</given-names>
</name>
<name>
<surname>Deinard</surname> <given-names>A. S.</given-names>
</name>
<name>
<surname>Kidd</surname> <given-names>K. K.</given-names>
</name>
<name>
<surname>Lenz</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Many human endogenous retrovirus K (HERV-K) proviruses are unique to humans</article-title>. <source>Curr. Biol.</source> <volume>9</volume>, <fpage>861</fpage>&#x2013;<lpage>868</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0960-9822(99)80390-X</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Benachenhou</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Sperber</surname> <given-names>G. O.</given-names>
</name>
<name>
<surname>Bongcam-Rudloff</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Andersson</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Boeke</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Blomberg</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Conserved structure and inferred evolutionary history of long terminal repeats (LTRs)</article-title>. <source>Mob. DNA</source> <volume>4</volume>, <elocation-id>5</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1759-8753-4-5</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brady</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>Y. N.</given-names>
</name>
<name>
<surname>Ronen</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Malani</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Berry</surname> <given-names>C. C.</given-names>
</name>
<name>
<surname>Bieniasz</surname> <given-names>P. D.</given-names>
</name>
<etal/>
</person-group>. (<year>2009</year>). <article-title>Integration target site selection by a resurrected human endogenous retrovirus</article-title>. <source>Genes Dev.</source> <volume>23</volume>, <fpage>633</fpage>&#x2013;<lpage>642</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gad.1762309</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Broecker</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Horton</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Heinrich</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Franz</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Schweiger</surname> <given-names>M.-R.</given-names>
</name>
<name>
<surname>Lehrach</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>The intron-enriched HERV-K(HML-10) family suppresses apoptosis, an indicator of malignant transformation</article-title>. <source>Mob. DNA</source> <volume>7</volume>, <fpage>25</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13100-016-0081-9</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Jia</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Ancient human endogenous retroviruses contribute to genetic evolution and regulate cancer cell type&#x2013;specific gene expression</article-title>. <source>Cancer Res.</source> <volume>82</volume>, <fpage>3457</fpage>&#x2013;<lpage>3473</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1158/0008-5472.CAN-22-0290</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Flockerzi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Burkhardt</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Schempp</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Meese</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Mayer</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Human endogenous retrovirus HERV-K14 families: status, variants, evolution, and mobilization of other cellular sequences</article-title>. <source>J. Virol.</source> <volume>79</volume>, <fpage>2941</fpage>&#x2013;<lpage>2949</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JVI.79.5.2941-2949.2005</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garcia-Montojo</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Doucet-O&#x2019;Hare</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Henderson</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Nath</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Human endogenous retrovirus-K (HML-2): a comprehensive review</article-title>. <source>Crit. Rev. Microbiol.</source> <volume>44</volume>, <fpage>715</fpage>&#x2013;<lpage>738</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/1040841X.2018.1501345</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grandi</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Cadeddu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Pisano</surname> <given-names>M. P.</given-names>
</name>
<name>
<surname>Esposito</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Blomberg</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Tramontano</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Identification of a novel HERV-K(HML10): comprehensive characterization and comparative analysis in non-human primates provide insights about HML10 proviruses structure and diffusion</article-title>. <source>Mob. DNA</source> <volume>8</volume>, <fpage>15</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13100-017-0099-7</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grandi</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Pisano</surname> <given-names>M. P.</given-names>
</name>
<name>
<surname>Pessiu</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Scognamiglio</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Tramontano</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>HERV-K(HML7) integrations in the human genome: comprehensive characterization and comparative analysis in non-human primates</article-title>. <source>Biol. (Basel).</source> <volume>10</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/biology10050439</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grow</surname> <given-names>E. J.</given-names>
</name>
<name>
<surname>Flynn</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Chavez</surname> <given-names>S. L.</given-names>
</name>
<name>
<surname>Bayless</surname> <given-names>N. L.</given-names>
</name>
<name>
<surname>Wossidlo</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Wesche</surname> <given-names>D. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Intrinsic retroviral reactivation in human preimplantation embryos and pluripotent cells</article-title>. <source>Nature</source> <volume>522</volume>, <fpage>221</fpage>&#x2013;<lpage>225</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature14308</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Holloway</surname> <given-names>J. R.</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>Z. H.</given-names>
</name>
<name>
<surname>Freeman</surname> <given-names>M. M.</given-names>
</name>
<name>
<surname>Bulow</surname> <given-names>U.</given-names>
</name>
<name>
<surname>Coffin</surname> <given-names>J. M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Gorillas have been infected with the HERV-K (HML-2) endogenous retrovirus much more recently than humans and chimpanzees</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>116</volume>, <fpage>1337</fpage>&#x2013;<lpage>1346</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1814203116</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hubley</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Finn</surname> <given-names>R. D.</given-names>
</name>
<name>
<surname>Clements</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Eddy</surname> <given-names>S. R.</given-names>
</name>
<name>
<surname>Jones</surname> <given-names>T. A.</given-names>
</name>
<name>
<surname>Bao</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>The Dfam database of repetitive DNA families</article-title>. <source>Nucleic Acids Res.</source> <volume>44</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkv1272</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hughes</surname> <given-names>J. F.</given-names>
</name>
<name>
<surname>Coffin</surname> <given-names>J. M.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Human endogenous retrovirus K solo-LTR formation and insertional polymorphisms: Implications for human and viral evolution</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>101</volume>, <fpage>1668</fpage>&#x2013;<lpage>1672</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0307885100</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jansz</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Faulkner</surname> <given-names>G. J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Endogenous retroviruses in the origins and treatment of cancer</article-title>. <source>Genome Biol.</source> <volume>22</volume>, <fpage>147</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-021-02357-4</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Jia</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Transpositional recombination and site-specific recombination may be initiated by copy choice during DNA synthesis rather than break/join mechanism</article-title>. <source>Preprints</source> doi: <pub-id pub-id-type="doi">10.20944/preprints201808.0317.v1</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jia</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Gui</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Analysis of HIV-1 intersubtype recombination breakpoints suggests region with high pairing probability may be a more fundamental factor than sequence similarity affecting HIV-1 recombination</article-title>. <source>Virol. J.</source> <volume>13</volume>, <fpage>156</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12985-016-0616-1</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jia</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Comprehensive identification and characterization of the HERV-K (HML-9) group in the human genome</article-title>. <source>Retrovirology</source> <volume>19</volume>, <elocation-id>11</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12977-022-00596-2</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johnson</surname> <given-names>W. E.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Origins and evolutionary consequences of ancient endogenous retroviruses</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>17</volume>, <fpage>355</fpage>&#x2013;<lpage>370</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41579-019-0189-2</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kent</surname> <given-names>W. J.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>BLAT&#x2014;the BLAST-like alignment tool</article-title>. <source>Genome Res.</source> <volume>12</volume>, <fpage>656</fpage>&#x2013;<lpage>664</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.229202</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kent</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Sugnet</surname> <given-names>C. W.</given-names>
</name>
<name>
<surname>Furey</surname> <given-names>T. S.</given-names>
</name>
<name>
<surname>Roskin</surname> <given-names>K. M.</given-names>
</name>
<name>
<surname>Pringle</surname> <given-names>T. H.</given-names>
</name>
<name>
<surname>Zahler</surname> <given-names>A. M.</given-names>
</name>
<etal/>
</person-group>. (<year>2002</year>). <article-title>The human genome browser at UCSC</article-title>. <source>Genome Res.</source> <volume>12</volume>, <fpage>996</fpage>&#x2013;<lpage>1006</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.229102</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kumar</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Stecher</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Tamura</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>MEGA7: molecular evolutionary genetics analysis version 7.0 for bigger datasets</article-title>. <source>Mol. Biol. Evol.</source> <volume>33</volume>, <fpage>1870</fpage>&#x2013;<lpage>1874</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msw054</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kunarso</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Chia</surname> <given-names>N. Y.</given-names>
</name>
<name>
<surname>Jeyakani</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Hwang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chan</surname> <given-names>Y. S.</given-names>
</name>
<etal/>
</person-group>. (<year>2010</year>). <article-title>Transposable elements have rewired the core regulatory network of human embryonic stem cells</article-title>. <source>Nat. Genet.</source> <volume>42</volume>, <fpage>631</fpage>&#x2013;<lpage>634</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ng.600</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lander</surname> <given-names>E. S.</given-names>
</name>
<name>
<surname>Linton</surname> <given-names>L. M.</given-names>
</name>
<name>
<surname>Birren</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Nusbaum</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Zody</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Baldwin</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2001</year>). <article-title>Initial sequencing and analysis of the human genome</article-title>. <source>Nature</source> <volume>409</volume>, <fpage>860</fpage>&#x2013;<lpage>921</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/35057062</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lavie</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Medstrand</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Schempp</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Meese</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Mayer</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Human endogenous retrovirus family HERV-K(HML-5): status, evolution, and reconstruction of an ancient betaretrovirus in the human genome</article-title>. <source>J. Virol.</source> <volume>78</volume>, <fpage>8788</fpage>&#x2013;<lpage>8798</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/JVI.78.16.8788-8798.2004</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lebedev</surname> <given-names>Y. B.</given-names>
</name>
<name>
<surname>Belonovitch</surname> <given-names>O. S.</given-names>
</name>
<name>
<surname>Zybrova</surname> <given-names>N. V.</given-names>
</name>
<name>
<surname>Khil</surname> <given-names>P. P.</given-names>
</name>
<name>
<surname>Kurdyukov</surname> <given-names>S. G.</given-names>
</name>
<name>
<surname>Vinogradova</surname> <given-names>T. V.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Differences in HERV-K LTR insertions in orthologous loci of humans and great apes</article-title>. <source>Gene</source> <volume>247</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/s0378-1119(00)00062-7</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Jia</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhai</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>). <article-title>Identification and characterization of the HERV-K (HML-8) group of human endogenous retroviruses in the genome</article-title>. <source>AIDS Res. Hum. Retroviruses</source> <volume>39</volume>, <fpage>176</fpage>&#x2013;<lpage>194</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1089/aid.2022.0084</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Macfarlane</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Badge</surname> <given-names>R. M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Genome-wide amplification of proviral sequences reveals new polymorphic HERV-K(HML-2) proviruses in humans and chimpanzees that are absent from genome assemblies</article-title>. <source>Retrovirology</source> <volume>12</volume>, <fpage>35</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12977-015-0162-8</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mager</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Goodchild</surname> <given-names>N. L.</given-names>
</name>
</person-group> (<year>1989</year>). <article-title>Homologous recombination between the LTRs of a human retrovirus-like element causes a 5-kb deletion in two siblings</article-title>. <source>Am. J. Hum. Genet.</source> <volume>45</volume>, <fpage>848</fpage>&#x2013;<lpage>854</lpage>.</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mager</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Stoye</surname> <given-names>J. P.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Mammalian endogenous retroviruses</article-title>. <source>Microbiol. Spectr.</source> <volume>3</volume> (<issue>1</issue>), <fpage>MDNA3-0009-2014</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/microbiolspec.MDNA3-0009-2014</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ono</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>1986</year>). <article-title>Molecular cloning and long terminal repeat sequences of human endogenous retrovirus genes related to types A and B retrovirus genes</article-title>. <source>J. Virol.</source> <volume>58</volume>, <fpage>937</fpage>&#x2013;<lpage>944</lpage>. doi: <pub-id pub-id-type="doi">10.1128/jvi.58.3.937-944.1986</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pisano</surname> <given-names>M. P.</given-names>
</name>
<name>
<surname>Grandi</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Cadeddu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Blomberg</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Tramontano</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Comprehensive characterization of the human endogenous retrovirus HERV-K(HML-6) group: overview of structure, phylogeny, and contribution to the human genome</article-title>. <source>J. Virol.</source> <volume>93</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/jvi.00110-19</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rhie</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Nurk</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Cechova</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hoyt</surname> <given-names>S. J.</given-names>
</name>
<name>
<surname>Taylor</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Altemose</surname> <given-names>N.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>). <article-title>The complete sequence of a human Y chromosome</article-title>. <source>Nature</source> <volume>621</volume>, <fpage>344</fpage>&#x2013;<lpage>354</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41586-023-06457-y</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scognamiglio</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Grandi</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Pessiu</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Tramontano</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Identification, comprehensive characterization, and comparative genomics of the HERV-K(HML8) integrations in the human genome</article-title>. <source>Virus Res.</source> <volume>323</volume>, <elocation-id>198976</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.virusres.2022.198976</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stoye</surname> <given-names>J. P.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Studies of endogenous retroviruses reveal a continuing evolutionary saga</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>10</volume>, <fpage>395</fpage>&#x2013;<lpage>406</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nrmicro2783</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Subramanian</surname> <given-names>R. P.</given-names>
</name>
<name>
<surname>Wildschutte</surname> <given-names>J. H.</given-names>
</name>
<name>
<surname>Russo</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Coffin</surname> <given-names>J. M.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Identification, characterization, and comparative genomic distribution of the HERV-K (HML-2) group of human endogenous retroviruses</article-title>. <source>Retrovirology</source> <volume>8</volume>, <elocation-id>90</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1742-4690-8-90</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tamura</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Stecher</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>MEGA11: molecular evolutionary genetics analysis version 11</article-title>. <source>Mol. Biol. Evol.</source> <volume>38</volume>, <fpage>3022</fpage>&#x2013;<lpage>3027</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msab120</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thomas</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Perron</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Feschotte</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Variation in proviral content among human genomes mediated by LTR recombination</article-title>. <source>Mob. DNA</source> <volume>9</volume>, <fpage>36</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13100-018-0142-3</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vargiu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Rodriguez-Tom&#xe9;</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Sperber</surname> <given-names>G. O.</given-names>
</name>
<name>
<surname>Cadeddu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Grandi</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Blikstad</surname> <given-names>V.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Classification and characterization of human endogenous retroviruses; mosaic forms are common</article-title>. <source>Retrovirology</source> <volume>13</volume>, <elocation-id>7</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12977-015-0232-y</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Venter</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Adams</surname> <given-names>M. D.</given-names>
</name>
<name>
<surname>Myers</surname> <given-names>E. W.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>P. W.</given-names>
</name>
<name>
<surname>Mural</surname> <given-names>R. J.</given-names>
</name>
<name>
<surname>Sutton</surname> <given-names>G. G.</given-names>
</name>
<etal/>
</person-group>. (<year>2001</year>). <article-title>The sequence of the human genome</article-title>. <source>Science</source> <volume>291</volume>, <fpage>1304</fpage>&#x2013;<lpage>1351</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1058040</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>