<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmolb.2016.00076</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Molecular Biosciences</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Patterns of Transposable Element Expression and Insertion in Cancer</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Clayton</surname> <given-names>Evan A.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/370966/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Lu</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Rishishwar</surname> <given-names>Lavanya</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/373745/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Jianrong</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>McDonald</surname> <given-names>John F.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/373842/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Jordan</surname> <given-names>I. King</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/372301/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Integrated Cancer Research Center, School of Biology, Georgia Institute of Technology</institution> <country>Atlanta, GA, USA</country></aff>
<aff id="aff2"><sup>2</sup><institution>Ovarian Cancer Institute</institution> <country>Atlanta, GA, USA</country></aff>
<aff id="aff3"><sup>3</sup><institution>School of Biology, Georgia Institute of Technology</institution> <country>Atlanta, GA, USA</country></aff>
<aff id="aff4"><sup>4</sup><institution>PanAmerican Bioinformatics Institute</institution> <country>Cali, Colombia</country></aff>
<aff id="aff5"><sup>5</sup><institution>Applied Bioinformatics Laboratory</institution> <country>Atlanta, GA, USA</country></aff>
<aff id="aff6"><sup>6</sup><institution>Department of Computational Mathematics, Science and Engineering, Michigan State University</institution> <country>East Lansing, MI, USA</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Tammy A. Morrish, Formerly affiliated with University of Toledo, USA</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: David Ray, Mississippi State University, USA; David E. Symer, Ohio State University Comp. Cancer Ctr., USA; Tara Theresa Doucet-O&#x00027;Hare, National Institutes of Health, USA</p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x0002A;Correspondence: I. King Jordan <email>king.jordan&#x00040;biology.gatech.edu</email></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Cellular Biochemistry, a section of the journal Frontiers in Molecular Biosciences</p></fn></author-notes>
<pub-date pub-type="epub">
<day>16</day>
<month>11</month>
<year>2016</year>
</pub-date>
<pub-date pub-type="collection">
<year>2016</year>
</pub-date>
<volume>3</volume>
<elocation-id>76</elocation-id>
<history>
<date date-type="received">
<day>24</day>
<month>08</month>
<year>2016</year>
</date>
<date date-type="accepted">
<day>31</day>
<month>10</month>
<year>2016</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2016 Clayton, Wang, Rishishwar, Wang, McDonald and Jordan.</copyright-statement>
<copyright-year>2016</copyright-year>
<copyright-holder>Clayton, Wang, Rishishwar, Wang, McDonald and Jordan</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><p>Human transposable element (TE) activity in somatic tissues causes mutations that can contribute to tumorigenesis. Indeed, TE insertion mutations have been implicated in the etiology of a number of different cancer types. Nevertheless, the full extent of somatic TE activity, along with its relationship to tumorigenesis, has yet to be fully explored. Recent developments in bioinformatics software make it possible to analyze TE expression levels and TE insertional activity directly from transcriptome (RNA-seq) and whole genome (DNA-seq) next-generation sequence data. We applied these new sequence analysis techniques to matched normal and primary tumor patient samples from the Cancer Genome Atlas (TCGA) in order to analyze the patterns of TE expression and insertion for three cancer types: breast invasive carcinoma, head and neck squamous cell carcinoma, and lung adenocarcinoma. Our analysis focused on the three most abundant families of active human TEs: Alu, SVA, and L1. We found evidence for high levels of somatic TE activity for these three families in normal and cancer samples across diverse tissue types. Abundant transcripts for all three TE families were detected in both normal and cancer tissues along with an average of &#x0007E;80 unique TE insertions per individual patient/tissue. We observed an increase in L1 transcript expression and L1 insertional activity in primary tumor samples for all three cancer types. Tumor-specific TE insertions are enriched for private mutations, consistent with a potentially causal role in tumorigenesis. We used genome feature analysis to investigate two specific cases of putative cancer-causing TE mutations in further detail. 
An Alu insertion in an upstream enhancer of the <italic>CBL</italic> tumor suppressor gene is associated with down-regulation of the gene in a single breast cancer patient, and an L1 insertion in the first exon of the <italic>BAALC</italic> gene also disrupts its expression in head and neck squamous cell carcinoma. Our results are consistent with widespread somatic activity of human TEs leading to numerous insertion mutations that can contribute to tumorigenesis in a variety of tissues.</p></abstract>
<kwd-group>
<kwd>LINE-1</kwd>
<kwd>L1</kwd>
<kwd>Alu</kwd>
<kwd>SVA</kwd>
<kwd>retrotransposons</kwd>
<kwd>bioinformatics</kwd>
<kwd>mutation</kwd>
<kwd>tumorigenesis</kwd>
</kwd-group>
<counts>
<fig-count count="4"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="71"/>
<page-count count="11"/>
<word-count count="7774"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>More than 50% of the human genome sequence is derived from transposable element (TE) insertions (Lander et al., <xref ref-type="bibr" rid="B35">2001</xref>; de Koning et al., <xref ref-type="bibr" rid="B20">2011</xref>). The vast majority of TE-derived sequences in the human genome correspond to relatively ancient insertions that are no longer capable of transposition (Mills et al., <xref ref-type="bibr" rid="B42">2007</xref>). However, there are several families of human TEs that remain active to this day. The most abundant families of active TEs in the human genome are the Alu and SVA short interspersed nuclear elements (SINEs) along with the L1 Long Interspersed Nuclear Element (LINE) family (Kazazian et al., <xref ref-type="bibr" rid="B33">1988</xref>; Batzer and Deininger, <xref ref-type="bibr" rid="B7">1991</xref>; Batzer et al., <xref ref-type="bibr" rid="B9">1991</xref>; Brouha et al., <xref ref-type="bibr" rid="B15">2003</xref>; Ostertag et al., <xref ref-type="bibr" rid="B46">2003</xref>; Wang et al., <xref ref-type="bibr" rid="B68">2005</xref>). Alu and SVA SINEs are non-autonomous TEs that are mobilized via the transpositional machinery encoded by the autonomous L1 family of LINEs. Recent evidence indicates that a handful of HERV-K endogenous retroviral elements also remain active in the human genome (Wildschutte et al., <xref ref-type="bibr" rid="B70">2016</xref>).</p>
<p>Active TE families are of great interest since they have the ability to generate <italic>de novo</italic> mutations, many of which have been linked to human disease (Hancks and Kazazian, <xref ref-type="bibr" rid="B28">2012</xref>; Solyom and Kazazian, <xref ref-type="bibr" rid="B61">2012</xref>). For instance, TE insertions have been shown to contribute to the etiology of a variety of different cancer types (Belancio et al., <xref ref-type="bibr" rid="B10">2010a</xref>; Carreira et al., <xref ref-type="bibr" rid="B16">2014</xref>). Numerous recent studies have used a combination of next-generation sequence analysis, followed by validation with PCR and/or Sanger sequencing, to elucidate connections between TE activity and cancer (Solyom et al., <xref ref-type="bibr" rid="B60">2012</xref>; Shukla et al., <xref ref-type="bibr" rid="B59">2013</xref>; Tubio et al., <xref ref-type="bibr" rid="B66">2014</xref>; Doucet-O&#x00027;Hare et al., <xref ref-type="bibr" rid="B21">2015</xref>; Ewing et al., <xref ref-type="bibr" rid="B24">2015</xref>). L1 insertions in particular have been implicated as potential cancer causing mutations in those and other studies (Morse et al., <xref ref-type="bibr" rid="B44">1988</xref>; Miki et al., <xref ref-type="bibr" rid="B41">1992</xref>; Iskow et al., <xref ref-type="bibr" rid="B31">2010</xref>; Lee et al., <xref ref-type="bibr" rid="B36">2012</xref>; Scott et al., <xref ref-type="bibr" rid="B57">2016</xref>). L1 activity is thought to promote tumor development by causing genomic instability, via impaired chromosomal pairing during mitosis, and/or by disrupting coding or regulatory sequences (Kemp and Longworth, <xref ref-type="bibr" rid="B34">2015</xref>).</p>
<p>Many of the studies that have related TEs to cancer have considered TE expression, at the transcript or protein level, and TE insertional activity separately. A number of different cancer types are positive for L1 transcript expression (Belancio et al., <xref ref-type="bibr" rid="B11">2010b</xref>), and L1 proteins have been shown to be ubiquitously expressed in both normal and tumor samples from the same individuals (Bratthauer and Fanning, <xref ref-type="bibr" rid="B13">1992</xref>, <xref ref-type="bibr" rid="B14">1993</xref>; Bratthauer et al., <xref ref-type="bibr" rid="B12">1994</xref>; Asch et al., <xref ref-type="bibr" rid="B5">1996</xref>; Doucet-O&#x00027;Hare et al., <xref ref-type="bibr" rid="B21">2015</xref>, <xref ref-type="bibr" rid="B22">2016</xref>). There is also evidence suggesting that L1 protein expression can be limited to tumor tissues and thereby serve as a useful cancer biomarker; nearly half of all human cancers are exclusively immunoreactive for L1-ORF1 encoded proteins (Rodic et al., <xref ref-type="bibr" rid="B55">2014</xref>). The expression of L1 proteins in tumors has been shown to affect the expression of a number of cancer-related genes, including the down-regulation of tumor suppressors (Rangasamy et al., <xref ref-type="bibr" rid="B51">2015</xref>). With respect to TE insertional activity, studies on matched normal and tumor tissues have found that novel L1 insertions occur at high frequencies in lung cancer genomes (Iskow et al., <xref ref-type="bibr" rid="B31">2010</xref>). Such insertions frequently occur in oncogenes and tumor suppressors, underscoring their putative role in tumorigenesis (Lee et al., <xref ref-type="bibr" rid="B36">2012</xref>).</p>
<p>A principal challenge when interpreting cancer genomes is distinguishing between so-called passenger and driver mutations. While passenger mutations are present in cancer genomes, they are not considered to contribute to cancer progression; instead, they are simply somatic mutations that arise during carcinogenesis and are carried along during clonal expansion. Driver mutations, on the other hand, are causal mutations that are directly implicated in carcinogenesis and the promotion of cancer growth (Stratton et al., <xref ref-type="bibr" rid="B62">2009</xref>; Marx, <xref ref-type="bibr" rid="B40">2014</xref>; Pon and Marra, <xref ref-type="bibr" rid="B48">2015</xref>). To date, only a few studies have directly implicated TE insertions as cancer driver mutations. One such study analyzed 19 hepatocellular carcinoma genomes utilizing the RC-Seq methodology (Baillie et al., <xref ref-type="bibr" rid="B6">2011</xref>) and discovered two separate L1 insertions that initiate tumorigenesis via distinct oncogenic pathways (Shukla et al., <xref ref-type="bibr" rid="B59">2013</xref>). This study found L1 insertions in two different tumor suppressor genes: Mutated in Colorectal Cancers (<italic>MCC</italic>) and Suppression of Tumorigenicity (<italic>ST18</italic>). Most recently, a role for L1 insertional activity was conclusively demonstrated for colorectal cancer caused by an insertion in the <italic>APC</italic> tumor suppressor gene (Scott et al., <xref ref-type="bibr" rid="B57">2016</xref>). This paper describes a somatic L1 insertion into one copy of the <italic>APC</italic> gene that, when coupled with a point mutation in the other copy of the gene, initiates tumorigenesis through the two hit colorectal cancer pathway.</p>
<p>Owing to parallel developments in genomics and bioinformatics, it is now possible to jointly analyze the patterns of TE transcript expression and TE insertional activity in human cancers. The Cancer Genome Atlas (TCGA) provides access to both transcriptome sequence data (RNA-seq) and whole genome sequence data (DNA-seq) for a number of matched normal and primary tumor sample pairs from individual patients (Weinstein et al., <xref ref-type="bibr" rid="B69">2013</xref>). In addition, recently developed bioinformatics algorithms allow for the detection of TE transcripts directly from RNA-seq data (Jin et al., <xref ref-type="bibr" rid="B32">2015</xref>) as well as for the characterization of novel TE insertions from DNA-seq data (Thung et al., <xref ref-type="bibr" rid="B64">2014</xref>; Sudmant et al., <xref ref-type="bibr" rid="B63">2015</xref>). We took advantage of these developments in order to evaluate the patterns of both TE expression and insertional activity in three cancer types: breast invasive carcinoma, head and neck squamous cell carcinoma, and lung adenocarcinoma (Figure <xref ref-type="fig" rid="F1">1</xref> and Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">1</xref>). We observed a simultaneous increase of L1 transcript expression and L1 insertional activity for primary tumor samples for all three cancers, and we evaluate individual cases of TE insertions that are implicated as potential cancer causing mutations.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p><bold>Scheme of the analytical design used in this study</bold>. Matched normal and primary tumor samples for three cancer types were analyzed using transcriptome (RNA-seq) and whole genome (DNA-seq) data. RNA-seq data were analyzed to compare normal versus cancer expression levels, and DNA-seq data were analyzed to identify somatic TE insertion events. The main bioinformatics programs (wrench) and databases (cylinder) used for each phase of the analysis are indicated.</p></caption>
<graphic xlink:href="fmolb-03-00076-g0001.tif"/>
</fig>
</sec>
<sec sec-type="materials and methods" id="s2">
<title>Materials and methods</title>
<sec>
<title>Genome and transcriptome sequence data</title>
<p>Whole genome sequence data (DNA-seq), transcriptome sequence data (RNA-seq) and patient metadata for matched normal and primary tumor tissue samples from nine cancer patients were acquired from TCGA (Weinstein et al., <xref ref-type="bibr" rid="B69">2013</xref>) via the Cancer Genomics Hub (CGHub) using the download client GeneTorrent (Maltbie et al., <xref ref-type="bibr" rid="B38">2013</xref>). The nine participants included three breast invasive carcinoma patients, three head and neck squamous cell carcinoma patients and three lung adenocarcinoma patients (Table <xref ref-type="table" rid="T1">1</xref>). DNA-seq and RNA-seq data were accessed as BAM files of paired-end Illumina sequence data aligned against the human genome reference sequence (build hg19). BAM files containing sequence alignments were validated for quality using FASTQC (Andrews, <xref ref-type="bibr" rid="B3">2011</xref>), and autosomes were extracted from the BAM files for downstream analysis using SAMtools (Li et al., <xref ref-type="bibr" rid="B37">2009</xref>).</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p><bold>TCGA whole genome (DNA-seq) and transcriptome (RNA-seq) data sources for the patients analyzed in this study</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>ID</bold></th>
<th valign="top" align="left"><bold>TCGA barcode</bold></th>
<th valign="top" align="left"><bold>Cancer type</bold></th>
<th valign="top" align="left"><bold>Sex</bold></th>
<th valign="top" align="left"><bold>Age</bold></th>
<th valign="top" align="left"><bold>Sample type<xref ref-type="table-fn" rid="TN1"><sup>a</sup></xref></bold></th>
<th valign="top" align="center"><bold>Seq depth</bold></th>
<th valign="top" align="center"><bold>Read len</bold>.</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Breast 1</td>
<td valign="top" align="left">TCGA-BH-A0B3-11B-21D-A128-09</td>
<td valign="top" align="left">Breast invasive carcinoma</td>
<td valign="top" align="left">F</td>
<td valign="top" align="left">53</td>
<td valign="top" align="left">NT-W</td>
<td valign="top" align="center">42.4</td>
<td valign="top" align="center">100</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-BH-A0B3-11B-21R-A089-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">NT-R</td>
<td valign="top" align="center">5.5</td>
<td valign="top" align="center">50</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-BH-A0B3-01A-11D-A128-09</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-W</td>
<td valign="top" align="center">40.2</td>
<td valign="top" align="center">100</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td/>
<td valign="top" align="left">TCGA-BH-A0B3-01B-21R-A089-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-R</td>
<td valign="top" align="center">5.4</td>
<td valign="top" align="center">50</td>
</tr> <tr>
<td valign="top" align="left">Breast 2</td>
<td valign="top" align="left">TCGA-BH-A0BW-11A-12D-A314-09</td>
<td/>
<td valign="top" align="left">F</td>
<td valign="top" align="left">71</td>
<td valign="top" align="left">NT-W</td>
<td valign="top" align="center">54.1</td>
<td valign="top" align="center">100</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-BH-A0BW-11A-12R-A115-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">NT-R</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">50</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-BH-A0BW-01A-11D-A10Y-09</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-W</td>
<td valign="top" align="center">46.1</td>
<td valign="top" align="center">100</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td/>
<td valign="top" align="left">TCGA-BH-A0BW-01A-12R-A115-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-R</td>
<td valign="top" align="center">7.3</td>
<td valign="top" align="center">50</td>
</tr> <tr>
<td valign="top" align="left">Breast 3</td>
<td valign="top" align="left">TCGA-BH-A0DT-11A-12D-A12B-09</td>
<td/>
<td valign="top" align="left">F</td>
<td valign="top" align="left">41</td>
<td valign="top" align="left">NT-W</td>
<td valign="top" align="center">63.3</td>
<td valign="top" align="center">100</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-BH-A0DT-11A-12R-A12D-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">NT-R</td>
<td valign="top" align="center">7.7</td>
<td valign="top" align="center">50</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-BH-A0DT-01A-21D-A12B-09</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-W</td>
<td valign="top" align="center">79.9</td>
<td valign="top" align="center">100</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td/>
<td valign="top" align="left">TCGA-BH-A0DT-01A-21R-A12D-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-R</td>
<td valign="top" align="center">6.6</td>
<td valign="top" align="center">50</td>
</tr> <tr>
<td valign="top" align="left">Head 1</td>
<td valign="top" align="left">TCGA-CV-7255-11A-01D-2276-10</td>
<td valign="top" align="left">Head and neck squamous cell carcinoma</td>
<td valign="top" align="left">F</td>
<td valign="top" align="left">32</td>
<td valign="top" align="left">NT-W</td>
<td valign="top" align="center">6.9</td>
<td valign="top" align="center">101</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-CV-7255-11A-01R-2016-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">NT-R</td>
<td valign="top" align="center">7.5</td>
<td valign="top" align="center">48</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-CV-7255-01A-11D-2276-10</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-W</td>
<td valign="top" align="center">5.8</td>
<td valign="top" align="center">101</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td/>
<td valign="top" align="left">TCGA-CV-7255-01A-11R-2016-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-R</td>
<td valign="top" align="center">7.1</td>
<td valign="top" align="center">48</td>
</tr> <tr>
<td valign="top" align="left">Head 2</td>
<td valign="top" align="left">TCGA-CV-7416-11A-01D-2334-08</td>
<td/>
<td valign="top" align="left">F</td>
<td valign="top" align="left">29</td>
<td valign="top" align="left">NT-W</td>
<td valign="top" align="center">7.7</td>
<td valign="top" align="center">101</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-CV-7416-11A-01R-2081-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">NT-R</td>
<td valign="top" align="center">5.9</td>
<td valign="top" align="center">48</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-CV-7416-01A-11D-2334-08</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-W</td>
<td valign="top" align="center">28.6</td>
<td valign="top" align="center">101</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td/>
<td valign="top" align="left">TCGA-CV-7416-01A-11R-2081-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-R</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">48</td>
</tr> <tr>
<td valign="top" align="left">Head 3</td>
<td valign="top" align="left">TCGA-CV-6959-11A-01D-1911-02</td>
<td/>
<td valign="top" align="left">M</td>
<td valign="top" align="left">48</td>
<td valign="top" align="left">NT-W</td>
<td valign="top" align="center">38.3</td>
<td valign="top" align="center">51</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-CV-6959-11A-01R-1915-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">NT-R</td>
<td valign="top" align="center">8.5</td>
<td valign="top" align="center">48</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-CV-6959-01A-11D-1911-02</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-W</td>
<td valign="top" align="center">31.4</td>
<td valign="top" align="center">51</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td/>
<td valign="top" align="left">TCGA-CV-6959-01A-11R-1915-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-R</td>
<td valign="top" align="center">6.6</td>
<td valign="top" align="center">48</td>
</tr> <tr>
<td valign="top" align="left">Lung 1</td>
<td valign="top" align="left">TCGA-44-6776-11A-01D-1853-02</td>
<td valign="top" align="left">Lung adenocarcinoma</td>
<td valign="top" align="left">F</td>
<td valign="top" align="left">60</td>
<td valign="top" align="left">NT-W</td>
<td valign="top" align="center">38.9</td>
<td valign="top" align="center">51</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-44-6776-11A-01R-1858-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">NT-R</td>
<td valign="top" align="center">5.4</td>
<td valign="top" align="center">48</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-44-6776-01A-11D-1853-02</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-W</td>
<td valign="top" align="center">6.9</td>
<td valign="top" align="center">51</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td/>
<td valign="top" align="left">TCGA-44-6776-01A-11R-1858-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-R</td>
<td valign="top" align="center">7.4</td>
<td valign="top" align="center">48</td>
</tr> <tr>
<td valign="top" align="left">Lung 2</td>
<td valign="top" align="left">TCGA-50-5932-11A-01D-1753-08</td>
<td/>
<td valign="top" align="left">M</td>
<td valign="top" align="left">75</td>
<td valign="top" align="left">NT-W</td>
<td valign="top" align="center">34.6</td>
<td valign="top" align="center">101</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-50-5932-11A-01R-1755-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">NT-R</td>
<td valign="top" align="center">4.2</td>
<td valign="top" align="center">48</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-50-5932-01A-11D-1753-08</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-W</td>
<td valign="top" align="center">44.5</td>
<td valign="top" align="center">101</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-50-5932-01A-11R-1755-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-R</td>
<td valign="top" align="center">7.4</td>
<td valign="top" align="center">48</td>
</tr> <tr>
<td valign="top" align="left">Lung 3</td>
<td valign="top" align="left">TCGA-55-6984-11A-01D-1945-08</td>
<td/>
<td valign="top" align="left">F</td>
<td valign="top" align="left">NA</td>
<td valign="top" align="left">NT-W</td>
<td valign="top" align="center">36.2</td>
<td valign="top" align="center">101</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-55-6984-11A-01R-1949-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">NT-R</td>
<td valign="top" align="center">4.9</td>
<td valign="top" align="center">48</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-55-6984-01A-11D-1945-08</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-W</td>
<td valign="top" align="center">41</td>
<td valign="top" align="center">101</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">TCGA-55-6984-01A-11R-1949-07</td>
<td/>
<td/>
<td/>
<td valign="top" align="left">TP-R</td>
<td valign="top" align="center">5.2</td>
<td valign="top" align="center">48</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="TN1">
<label>a</label>
<p><italic>NT-W, Normal tissue whole genome DNA-seq; NT-R, Normal tissue RNA-seq; TP-W, Tumor primary whole genome DNA-seq; TP-R, Tumor primary RNA-seq</italic>.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>Gene and transposable element (TE) expression levels</title>
<p>Gene and TE expression levels were measured using RNA-seq data for the nine matched normal and primary tumor tissue samples. Gene expression levels were quantified as read counts mapped to NCBI RefSeq gene annotations (Pruitt et al., <xref ref-type="bibr" rid="B49">2012</xref>). TE expression levels&#x02014;for Alu, L1 and SVA elements&#x02014;were quantified using reads mapped to RepeatMasker annotations, which were subsequently analyzed with the TEtranscripts package (Jin et al., <xref ref-type="bibr" rid="B32">2015</xref>). The TEtranscripts program uses an expectation maximization (EM) algorithm to choose optimal unique TE locations for multi-mapped reads, thereby allowing for accurate expression level measurements for active TE families. The TEtranscripts method was recently shown to yield more reliable measures of TE transcription levels compared to previously published methods, such as HTSeq-count, Cufflinks, and RepEnrich (Trapnell et al., <xref ref-type="bibr" rid="B65">2010</xref>; Criscione et al., <xref ref-type="bibr" rid="B17">2014</xref>; Anders et al., <xref ref-type="bibr" rid="B2">2015</xref>). The L1Base database was used to identify the genomic locations of 145 full length, intact elements from the most recently active L1 subfamily (Penzkofer et al., <xref ref-type="bibr" rid="B47">2005</xref>). The set of full-length intact L1 sequences from the L1Base was generated by performing a BLAST search using the human genomic DNA sequences against the L1 template sequence (Penzkofer et al., <xref ref-type="bibr" rid="B47">2005</xref>). L1Base was used to facilitate measures of active L1 element expression by limiting our analysis to RNA-seq reads that map to full-length, intact L1 sequences which retain the potential to be transpositionally active. 
This was done in an effort to ensure that the reads we analyzed were taken from potentially active L1 elements as opposed to older fixed elements, which could represent read-through transcripts initiated from nearby genomic promoters. The expression levels of these potentially active L1 elements were analyzed separately using the TEtranscripts method.</p>
<p>Differential expression levels between normal and cancer tissue pairs, for genes and TEs, were evaluated by comparing distributions of log<sub>10</sub> transformed RNA-seq expression levels characterized as described above. The statistical significance levels of the observed differential expression between normal and cancer pairs were evaluated by comparing these distributions using the non-parametric Kolmogorov-Smirnov test. Statistical comparisons were done separately for each tissue (cancer) type: breast invasive carcinoma, head and neck squamous cell carcinoma and lung adenocarcinoma.</p>
 
</sec>
<sec>
<title>Transposable element insertion detection</title>
<p>The genomic locations of novel TE insertions from matched normal and primary tumor tissue samples were predicted based on discordant read-pair mapping of DNA-seq data (Ewing, <xref ref-type="bibr" rid="B23">2015</xref>) (Table <xref ref-type="table" rid="T2">2</xref>). A scheme of our TE insertion detection analysis pipeline is shown in Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">2</xref>. DNA-seq BAM files were realigned according to GATK&#x00027;s standard indel realignment method (Van der Auwera et al., <xref ref-type="bibr" rid="B67">2013</xref>) to facilitate TE insertion detection. The programs MELT (Sudmant et al., <xref ref-type="bibr" rid="B63">2015</xref>) and Mobster (Thung et al., <xref ref-type="bibr" rid="B64">2014</xref>) were used together for TE insertion detection. These two programs were selected owing to their previously demonstrated superior performance for human TE insertion detection (Rishishwar et al., <xref ref-type="bibr" rid="B52">2016</xref>). Only TE insertion sites that were found by both methods (i.e., the intersection of the predictions) were used for subsequent analysis. TE insertion predictions made by the individual programs were considered to represent the same insertion if they were found within &#x000B1;100 bp of each other. An additional filtering step was applied based on the number of mapped sequence reads (coverage) that support each TE insertion prediction. Only predictions with a minimum coverage of 5 reads and a maximum coverage of 4X the average sequencing depth of the sample were used for subsequent analysis. These upper and lower cut-off thresholds were empirically chosen based on the observed distributions of the numbers of discordant mapped read pairs used to call individual TE insertions. Read count distributions were computed individually for each program (MELT, Mobster) used and for each sample (Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">3</xref>). 
The resulting distributions were typically bimodal with a lower peak (i.e., with lower read count support) that we considered to be enriched for potential false positive TE insertion calls. The lower cut-off threshold of 5 reads was chosen to minimize such false positives, and the upper cut-off threshold was chosen to remove calls made in genomic regions that show anomalously high numbers of mapped reads, which tend to be enriched for ambiguously mapped reads.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p><bold>Numbers of MELT and Mobster predicted TE insertions in matched normal (N) and primary tumor (T) samples across 9 individuals</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Participant ID</bold></th>
<th valign="top" align="center" colspan="4" style="border-bottom: thin solid #000000;"><bold>TE insertions in matched normal tissue</bold></th>
<th valign="top" align="center" colspan="4" style="border-bottom: thin solid #000000;"><bold>TE insertions in tumor primary tissue</bold></th>
</tr>
<tr>
<th/>
<th valign="top" align="center"><bold>Alu</bold></th>
<th valign="top" align="center"><bold>SVA</bold></th>
<th valign="top" align="center"><bold>L1</bold></th>
<th valign="top" align="center"><bold>Total</bold></th>
<th valign="top" align="center"><bold>Alu</bold></th>
<th valign="top" align="center"><bold>SVA</bold></th>
<th valign="top" align="center"><bold>L1</bold></th>
<th valign="top" align="center"><bold>Total</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Breast 1</td>
<td valign="top" align="center">913</td>
<td valign="top" align="center">28</td>
<td valign="top" align="center">127</td>
<td valign="top" align="center">1069</td>
<td valign="top" align="center">853</td>
<td valign="top" align="center">33</td>
<td valign="top" align="center">110</td>
<td valign="top" align="center">997</td>
</tr>
<tr>
<td valign="top" align="left">Breast 2</td>
<td valign="top" align="center">1004</td>
<td valign="top" align="center">21</td>
<td valign="top" align="center">121</td>
<td valign="top" align="center">1147</td>
<td valign="top" align="center">1160</td>
<td valign="top" align="center">54</td>
<td valign="top" align="center">143</td>
<td valign="top" align="center">1358</td>
</tr>
<tr>
<td valign="top" align="left">Breast 3</td>
<td valign="top" align="center">1012</td>
<td valign="top" align="center">63</td>
<td valign="top" align="center">139</td>
<td valign="top" align="center">1215</td>
<td valign="top" align="center">952</td>
<td valign="top" align="center">60</td>
<td valign="top" align="center">136</td>
<td valign="top" align="center">1149</td>
</tr>
<tr>
<td valign="top" align="left">Head 1</td>
<td valign="top" align="center">984</td>
<td valign="top" align="center">72</td>
<td valign="top" align="center">140</td>
<td valign="top" align="center">1197</td>
<td valign="top" align="center">741</td>
<td valign="top" align="center">66</td>
<td valign="top" align="center">107</td>
<td valign="top" align="center">915</td>
</tr>
<tr>
<td valign="top" align="left">Head 2</td>
<td valign="top" align="center">945</td>
<td valign="top" align="center">25</td>
<td valign="top" align="center">131</td>
<td valign="top" align="center">1102</td>
<td valign="top" align="center">832</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">138</td>
<td valign="top" align="center">997</td>
</tr>
<tr>
<td valign="top" align="left">Head 3</td>
<td valign="top" align="center">860</td>
<td valign="top" align="center">36</td>
<td valign="top" align="center">108</td>
<td valign="top" align="center">1005</td>
<td valign="top" align="center">819</td>
<td valign="top" align="center">41</td>
<td valign="top" align="center">112</td>
<td valign="top" align="center">973</td>
</tr>
<tr>
<td valign="top" align="left">Lung 1</td>
<td valign="top" align="center">716</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">838</td>
<td valign="top" align="center">780</td>
<td valign="top" align="center">36</td>
<td valign="top" align="center">113</td>
<td valign="top" align="center">930</td>
</tr>
<tr>
<td valign="top" align="left">Lung 2</td>
<td valign="top" align="center">806</td>
<td valign="top" align="center">25</td>
<td valign="top" align="center">103</td>
<td valign="top" align="center">935</td>
<td valign="top" align="center">701</td>
<td valign="top" align="center">20</td>
<td valign="top" align="center">94</td>
<td valign="top" align="center">816</td>
</tr>
<tr>
<td valign="top" align="left">Lung 3</td>
<td valign="top" align="center">856</td>
<td valign="top" align="center">21</td>
<td valign="top" align="center">110</td>
<td valign="top" align="center">988</td>
<td valign="top" align="center">746</td>
<td valign="top" align="center">14</td>
<td valign="top" align="center">100</td>
<td valign="top" align="center">861</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The observed versus expected counts of unique L1 insertions were compared for matched normal and primary tumor tissue samples. The observed counts were taken from the TE detection pipeline, and the expected counts were computed as the ratio of unique insertions seen in matched normal vs. primary tumor tissue for all TEs multiplied by the total number of observed L1 insertions. The significance of the difference between the observed and expected counts of unique L1 insertions was evaluated using Fisher&#x00027;s exact test. Counts of TE insertions for matched normal and primary tumor tissue samples were characterized based on their frequencies from the 1000 Genomes Project (1KGP) (Sudmant et al., <xref ref-type="bibr" rid="B63">2015</xref>) and grouped into three distinct frequency bins. The distributions of TE insertion counts across the three frequency bins were compared for matched normal and cancer samples for the different tissue types analyzed here, and the significance of the differences between these distributions was evaluated using the Kolmogorov-Smirnov test.</p>
</sec>
<sec>
<title>TE insertion genome feature analysis</title>
<p>The genomic locations of novel TE insertions were considered with respect to several genomic features using the BEDTools program (Quinlan, <xref ref-type="bibr" rid="B50">2014</xref>): RefSeq genes (Pruitt et al., <xref ref-type="bibr" rid="B49">2012</xref>), COSMIC tumor suppressor genes (Forbes et al., <xref ref-type="bibr" rid="B25">2015</xref>), and enhancer elements defined by chromatin states (Roadmap Epigenomics et al., <xref ref-type="bibr" rid="B54">2015</xref>). The population allele frequencies of the predicted TE insertions were computed from the Phase 3 release of the 1KGP (Sudmant et al., <xref ref-type="bibr" rid="B63">2015</xref>) as previously described (Rishishwar et al., <xref ref-type="bibr" rid="B53">2015</xref>).</p>
</sec>
</sec>
<sec id="s3">
<title>Results and discussion</title>
<sec>
<title>TE expression levels in matched normal vs. primary tumor tissue samples</title>
<p>RNA-seq data were used to evaluate the differences in TE expression levels between matched normal and primary tumor tissue samples as described in the Materials and Methods. The observed differences in gene expression levels between normal and tumor tissue were compared to differences in TE expression levels for breast invasive carcinoma, head and neck squamous cell carcinoma, and lung adenocarcinoma. There are no significant differences observed for the distributions of gene expression levels between matched normal and primary tumor tissue pairs for any of the three cancer types analyzed here (Figure <xref ref-type="fig" rid="F2">2</xref>). Similarly, when all three families of potentially active TEs (Alu, L1, and SVA) are considered together, there is no significant difference seen for the overall levels of expression between matched normal and tumor tissue. However, when full-length, potentially active L1 sequences are considered alone, we observe statistically significant increases in L1 expression levels for all three cancer types.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p><bold>Gene expression levels for matched normal vs. primary tumor tissue pairs</bold>. Normal tissue (NT) and tumor primary (TP) expression levels were measured for genes, transposable elements (TEs) and LINE1 elements (L1s) via analysis of RNA-seq data as described in the Materials and Methods. Expression levels are shown as distributions of log<sub>10</sub> transformed read counts, and normal versus tumor comparisons are shown for breast invasive carcinoma (green), head and neck squamous cell carcinoma (red), and lung adenocarcinoma (blue). For each tissue type, the significance levels of the differences in L1 expression between normal and cancer pairs are indicated with <italic>P</italic>-values from the Kolmogorov-Smirnov test.</p></caption>
<graphic xlink:href="fmolb-03-00076-g0002.tif"/>
</fig>
<p>The methods that we used to characterize TE expression levels include several analytical controls aimed to ensure that only genuine TE-initiated transcripts, from members of potentially active families, are measured. Nevertheless, the lack of a difference between normal and tumor expression levels observed when all three active TE families were considered together could reflect technical difficulties with identifying <italic>bona fide</italic> TE transcripts that are initiated from element promoters as opposed to TE sequences that are passively expressed as part of longer genic transcripts. This is particularly true for Alu elements, many of which are found in the introns of human genes and transcribed as read-through transcripts initiated from RNA Pol II gene promoters (Deininger, <xref ref-type="bibr" rid="B19">2011</xref>). Our confidence in the ability to measure L1-initiated transcripts is higher owing to the focus on previously identified full-length, intact elements that are located in intergenic regions. In any case, the up-regulation of L1s in cancer that we observed has potential implications for increased TE insertional activity for all three families, since L1 encoded proteins are responsible for the <italic>cis</italic> retrotransposition of L1s as well as the <italic>trans</italic> activation of Alu and SVA elements (Batzer and Deininger, <xref ref-type="bibr" rid="B8">2002</xref>; Hancks and Kazazian, <xref ref-type="bibr" rid="B27">2010</xref>). We analyzed the same pairs of matched normal and primary tumor tissues to evaluate whether the observed increase in L1 expression corresponds to increased transpositional activity of human TEs.</p>
</sec>
<sec>
<title>Novel TE insertions in matched normal and primary tumor tissue samples</title>
<p>It is now possible to characterize the genomic locations and copy numbers of individual TE insertions from whole genome DNA-seq data owing to recent developments in computational genomics software (Ewing, <xref ref-type="bibr" rid="B23">2015</xref>; Rishishwar et al., <xref ref-type="bibr" rid="B52">2016</xref>). This technological advance is exemplified by the recent Phase 3 release of the 1KGP, which includes a complete genome-wide census of polymorphic TE insertion sites for 2504 individuals across 26 human populations (Sudmant et al., <xref ref-type="bibr" rid="B63">2015</xref>). We analyzed whole genome DNA-seq data using computational methods for TE insertion detection (see Materials and Methods) in order to compare TE insertional activity between matched normal versus primary tumor tissue samples.</p>
<p>When all three families of active human TEs are considered together, we observed a total of 3672 TE insertions across the nine individuals analyzed for normal and cancer tissue pairs, 693 of which are unique insertions found in only one individual and one tissue type. In other words, we observe an average of &#x0007E;77 unique somatic TE insertions per person, i.e., &#x0201C;private&#x0201D; TE insertions. This estimate is similar to the value of &#x0007E;90 unique (presumably germline) TE insertions that we previously observed for individuals from the 1KGP (Rishishwar et al., <xref ref-type="bibr" rid="B53">2015</xref>). A large majority of the observed TE insertions&#x02014;81% for all TEs and 62% for L1s alone&#x02014;are shared between the normal and tumor tissue types of an individual, suggesting that they represent germline insertions (Figure <xref ref-type="fig" rid="F3">3A</xref>). There are 1.3x more unique TE insertions seen for tumor compared to normal tissue, and this effect is more pronounced for L1s alone, which are 2x more abundant in tumor tissue samples. Accordingly, there is a statistically significant excess of observed versus expected L1 insertions in tumor versus normal tissue (<italic>P</italic> &#x0003D; 0.019) (Figure <xref ref-type="fig" rid="F3">3B</xref>). These results are consistent with a potential role for L1 transpositional activity in tumorigenesis for the cancer types analyzed here, as has been previously suggested for several different cancers (Morse et al., <xref ref-type="bibr" rid="B44">1988</xref>; Iskow et al., <xref ref-type="bibr" rid="B31">2010</xref>; Lee et al., <xref ref-type="bibr" rid="B36">2012</xref>; Scott et al., <xref ref-type="bibr" rid="B57">2016</xref>).</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p><bold>TE insertional activity in matched normal vs. primary tumor tissue pairs</bold>. The numbers of TE insertions were measured for normal and primary tumor tissue pairs for breast invasive carcinoma, head and neck squamous cell carcinoma, and lung adenocarcinoma via analysis of whole genome DNA-seq data as described in the Materials and Methods. <bold>(A)</bold> The total numbers of predicted TE insertions, pooled for all nine individuals over the three cancer types analyzed here, are shown for normal vs. tumor tissue. Venn diagrams show the numbers of unique versus shared TE insertions for the two tissue types. <bold>(B)</bold> Comparison of the observed versus expected numbers of unique L1 insertions for normal vs. tumor tissue. <bold>(C)</bold> Comparisons of the population frequencies of observed TE insertions in matched normal vs. tumor tissue pairs are shown for all of the TEs analyzed here and for L1s alone. <bold>(D&#x02013;F)</bold> The same comparisons of TE insertion population frequencies are shown individually for each cancer type analyzed here. TE insertion population frequencies are color coded as shown in the key. <italic>P</italic>-values show the significance of the differences for observed distributions based on the Fisher&#x00027;s exact test <bold>(B)</bold> and the Kolmogorov-Smirnov test <bold>(C&#x02013;F)</bold>.</p></caption>
<graphic xlink:href="fmolb-03-00076-g0003.tif"/>
</fig>
<p>Given the relatively high level of L1 insertional activity in the tumor tissue samples analyzed here, we tested whether tumor-specific L1 insertions are found at lower frequencies among the (presumably) healthy donors from the 1KGP compared to L1 insertions found in matched normal tissue. The idea was to evaluate whether the tumor-specific L1 insertions represent mutations that are private, and thereby more likely to be deleterious or disease-causing. To do this, individual TE insertions were classified as high frequency (&#x0003E;0.05), low frequency (&#x0003C;0.05) or private (absent) according to their previously characterized population (allele) frequencies from the 1KGP (Rishishwar et al., <xref ref-type="bibr" rid="B53">2015</xref>; Sudmant et al., <xref ref-type="bibr" rid="B63">2015</xref>).</p>
<p>When all three cancer types are considered together, there is a statistically significant excess of private and low frequency TE insertions observed for tumor compared to normal tissue (<italic>P</italic> &#x0003D; 1.9e-61) (Figure <xref ref-type="fig" rid="F3">3C</xref>). This effect is even more pronounced when L1 insertions are considered alone (<italic>P</italic> &#x0003D; 2.7e-23). The same pattern of an increased frequency of private L1 insertions in tumor tissue is observed (<italic>P</italic> &#x0003C; 2.0e-7) when all three cancer types are analyzed for sets of patients (Figures <xref ref-type="fig" rid="F3">3D&#x02013;F</xref>) and when samples for individual patients are analyzed separately (Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">4</xref>). The strongest effect is seen for head and neck squamous cell carcinoma. The pattern of a significant excess of private L1 insertions in tumor compared to normal tissue, observed for all three cancer types studied here, provides further evidence in support of a possible role for L1 activity in tumorigenesis.</p>
<p>It should be noted that TE insertions found in low copy numbers may not be detectable using next-generation sequence analysis, whereas such insertions may be uncovered using more sensitive PCR-based approaches. False negatives of this kind will be more prevalent at low levels of sequence coverage. We have tried to control for this by using studies with relatively high sequence coverage (&#x0007E;35X) here, but the conservative lower read count cut-off of 5 reads per TE insertion call that we used may still lead to missing TE insertion calls. Sequence based predictions can also yield false-positive TE insertion calls. In an effort to deal with this issue, we have only used high-confidence calls produced by two independent programs&#x02014;MELT and Mobster&#x02014;that we have recently shown to be most reliable for the detection of human TE insertions (Rishishwar et al., <xref ref-type="bibr" rid="B52">2016</xref>).</p>
<p>One other potential problem with the sequence based analysis relates to the base pair resolution with which TE insertions can be called via computational analysis of next-generation sequence data. Currently, the most accurate programs for calling TE insertions from next-generation sequence data do not yet allow for the insertions to be precisely located to genomic regions at single base pair resolution. To account for this fact, TE insertions called within a window of &#x000B1;100 bp are considered to be co-located (Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">2</xref>). It is possible that this approximation can lead to multiple TE insertion events being collapsed into a single event. Subsequent experimental confirmation of individual TE insertion calls of interest (e.g., potentially tumorigenic TE insertions) should help to provide certainty with respect to both their validity and their precise genomic locations.</p>
</sec>
<sec>
<title>Potentially tumorigenic TE insertions</title>
<p>Having established a potential role for transpositional activity in tumorigenesis using the genome-wide approaches described above, we wanted to search for specific examples where individual TE insertions could be implicated as possible cancer driver mutations. To do so, we performed an integrated analysis of TE insertion, gene expression and chromatin data (see Materials and Methods) in an effort to identify the cancer-specific TE insertions that are most likely to play a causal role in tumorigenesis. We considered TE insertions that are co-located with either exons or regulatory elements of previously characterized tumor suppressor genes to have the highest likelihood of being functionally relevant. We observed a total of 141 intergenic (35.9%) insertions and 246 intronic insertions (62.6%) out of the 393 total cancer-specific insertions in our dataset. None of these intergenic or intronic cancer-specific TE insertions were found to disrupt any known functional (regulatory) sequence element. Thus, consistent with previous studies, the vast majority of TE insertions that we observed are not likely to affect gene function or expression in cancer. We did find 4 exonic TE insertions, along with 2 insertions located in regulatory elements, for known tumor suppressor genes (1.5% of the total). Here, we focus on two of these potential cases of cancer driver TE insertions, which could prove to be of interest to the TE and/or cancer research communities.</p>
<p>There is a private, breast cancer tumor-specific Alu insertion that is located within an upstream enhancer element that helps to regulate the expression of the Cbl Proto-Oncogene (<italic>CBL</italic>) gene (Figure <xref ref-type="fig" rid="F4">4A</xref>). <italic>CBL</italic> is classified as a tumor suppressor gene by the COSMIC database (Forbes et al., <xref ref-type="bibr" rid="B25">2015</xref>). It has been found to be mutated or translocated in a number of cancers including acute myeloid leukemia (Abbas et al., <xref ref-type="bibr" rid="B1">2008</xref>; Naramura et al., <xref ref-type="bibr" rid="B45">2011</xref>; Aranaz et al., <xref ref-type="bibr" rid="B4">2013</xref>); mutations in <italic>CBL</italic> are also the cause of Noonan syndrome-like disorder (Martinelli et al., <xref ref-type="bibr" rid="B39">2010</xref>). The <italic>CBL</italic> encoded protein functions as a negative regulator of signal transduction pathways (Schmidt and Dikic, <xref ref-type="bibr" rid="B56">2005</xref>), activation of which has been associated with cancer (Sever and Brugge, <xref ref-type="bibr" rid="B58">2015</xref>). The tumor-specific Alu enhancer insertion that we characterized is associated with down-regulation of <italic>CBL</italic> expression, consistent with a potential role in tumorigenesis via the activation of signal transduction pathways associated with cell proliferation (Sever and Brugge, <xref ref-type="bibr" rid="B58">2015</xref>).</p>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p><bold>Private TE insertions implicated as potential cancer driver mutations. (A)</bold> A tumor-specific Alu insertion (red) is found in a single breast cancer patient. The insertion is located within an upstream enhancer for the <italic>CBL</italic> gene on chromosome 11 (gene model shown in blue), as indicated by enhancer-associated chromatin marks (inset yellow bars). Presence of the Alu insertion is associated with down-regulation of <italic>CBL</italic> (expression levels in green). <bold>(B)</bold> A tumor-specific L1 insertion (red) is located within the first exon of the <italic>BAALC</italic> gene on chromosome 8 (gene model shown in blue). Co-location of the L1 insertion with promoter-associated chromatin marks (purple bars) is shown in the inset. Presence of the L1 insertion is associated with down-regulation of <italic>BAALC</italic> (expression levels in red).</p></caption>
<graphic xlink:href="fmolb-03-00076-g0004.tif"/>
</fig>
<p>We also found a private L1 insertion that was unique to a head and neck squamous cell carcinoma tissue sample, located within the first exon of the Brain and Acute Leukemia, Cytoplasmic (<italic>BAALC</italic>) gene (Figure <xref ref-type="fig" rid="F4">4B</xref>). As its name implies, the <italic>BAALC</italic> gene is expressed in the brain and related neural tissues, and it was first identified by association with acute myeloid leukemia where it was shown to be overexpressed (Damiani et al., <xref ref-type="bibr" rid="B18">2013</xref>; Zhou et al., <xref ref-type="bibr" rid="B71">2015</xref>). TE insertions within exons are extremely rare and would presumably have a dramatic effect on gene function. Indeed, this particular insertion is associated with nearly complete inactivation of the <italic>BAALC</italic> gene. This is consistent with previous results showing that the presence of fixed L1 insertions genome-wide is strongly associated with the down-regulation of human gene expression (Han et al., <xref ref-type="bibr" rid="B26">2004</xref>). A recent study has demonstrated that <italic>BAALC</italic> can inhibit extracellular signal-regulated kinase (ERK) mediated monocytic differentiation of AML cells (Morita et al., <xref ref-type="bibr" rid="B43">2015</xref>). Thus, down-regulation of <italic>BAALC</italic> would presumably result in a loss of control over cellular differentiation, consistent with a possible role in tumorigenesis. A recent study discovered a role for the change in methylation status of a cancer-specific L1 insertion in tumorigenesis (Scott et al., <xref ref-type="bibr" rid="B57">2016</xref>); this could be an additional mechanism by which the <italic>BAALC</italic> L1 insertion observed here exerts a regulatory effect.</p>
</sec>
</sec>
<sec sec-type="conclusions" id="s4">
<title>Conclusion</title>
<p>The results of our analysis show a surprisingly high level of somatic TE activity in the human genome. Abundant transcripts from members of all three active human TE families analyzed here&#x02014;Alu, SVA and L1&#x02014;can be identified for both normal and cancer tissue samples. In addition, after filtering for high confidence TE insertion calls, we identified an average of close to 80 unique insertions for each tissue among the individual patients in our study. Thus, active human TE families retain the ability to transpose in somatic tissue thereby generating substantial levels of cellular heterogeneity among diverse tissues.</p>
<p>We also observe a correlated increase in both transcript expression levels and transpositional activity for L1 elements in cancer tissue samples when compared to matched normal tissue. Increased cancer expression of L1 elements is particularly relevant for TE insertional activity, since the L1 transpositional machinery is responsible for transposing non-autonomous Alu and SVA elements in <italic>trans</italic> along with L1 elements in <italic>cis</italic>. Our results are consistent with previous studies showing expression of L1 transcripts in lung cancer (Belancio et al., <xref ref-type="bibr" rid="B11">2010b</xref>) and expression of L1 ORF1p in breast cancer (Harris et al., <xref ref-type="bibr" rid="B29">2010</xref>), and tumor-specific L1 insertions have also previously been found in breast (Morse et al., <xref ref-type="bibr" rid="B44">1988</xref>), head and neck (Helman et al., <xref ref-type="bibr" rid="B30">2014</xref>), and lung tumors (Helman et al., <xref ref-type="bibr" rid="B30">2014</xref>). We confirmed the presence of numerous tumor-specific L1 insertions in these three cancer types and identified two potentially tumorigenic TE insertions, an Alu insertion in the enhancer region of the tumor suppressor gene <italic>CBL</italic> and an L1 insertion in the first exon of the <italic>BAALC</italic> gene. These results underscore the potential for somatic TE activity to generate cellular heterogeneity and to contribute to the etiology of cancer across a wide range of human tissues.</p>
</sec>
<sec id="s5">
<title>Ethics statement</title>
<p>Ethical approval was not required for this study on restricted access, de-identified data in accordance with the guidelines of the Cancer Genome Atlas (TCGA). Access to the data was approved by the data access committee of the TCGA.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>EC, LW, and LR performed all of the analyses described in the study. JW contributed to the genome feature analysis. IJ and JM conceived of, designed, and supervised the study. All authors contributed to the drafting and revision of the manuscript.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>EC and LW were supported by the Georgia Tech Bioinformatics Graduate Program. LR and IJ were supported by the IHRC-Georgia Tech Applied Bioinformatics Laboratory (ABiL).</p>
<sec>
<title>Conflict of interest statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</sec>
</body>
<back>
<ack><p>The results published here are in whole or part based upon data generated by The Cancer Genome Atlas managed by the NCI and NHGRI. Information about TCGA can be found at <ext-link ext-link-type="uri" xlink:href="http://cancergenome.nih.gov">http://cancergenome.nih.gov</ext-link>. The authors thank Emily Norris for feedback on the manuscript.</p>
</ack>
<sec sec-type="supplementary-material" id="s8">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="http://journal.frontiersin.org/article/10.3389/fmolb.2016.00076/full#supplementary-material">http://journal.frontiersin.org/article/10.3389/fmolb.2016.00076/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image1.pdf" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Abbas</surname> <given-names>S.</given-names></name> <name><surname>Rotmans</surname> <given-names>G.</given-names></name> <name><surname>L&#x000F6;wenberg</surname> <given-names>B.</given-names></name> <name><surname>Valk</surname> <given-names>P. J.</given-names></name></person-group> (<year>2008</year>). <article-title>Exon 8 splice site mutations in the gene encoding the E3-ligase CBL are associated with core binding factor acute myeloid leukemias</article-title>. <source>Haematologica</source> <volume>93</volume>, <fpage>1595</fpage>&#x02013;<lpage>1597</lpage>. <pub-id pub-id-type="doi">10.3324/haematol.13187</pub-id><pub-id pub-id-type="pmid">18698078</pub-id></citation>
</ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Anders</surname> <given-names>S.</given-names></name> <name><surname>Pyl</surname> <given-names>P. T.</given-names></name> <name><surname>Huber</surname> <given-names>W.</given-names></name></person-group> (<year>2015</year>). <article-title>HTSeq&#x02013;a Python framework to work with high-throughput sequencing data</article-title>. <source>Bioinformatics</source> <volume>31</volume>, <fpage>166</fpage>&#x02013;<lpage>169</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu638</pub-id><pub-id pub-id-type="pmid">25260700</pub-id></citation>
</ref>
<ref id="B3">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Andrews</surname> <given-names>S.</given-names></name></person-group> (<year>2011</year>). <source>FastQC A Quality Control Tool for High Throughput Sequence Data</source>. <publisher-loc>Cambridge</publisher-loc>: <publisher-name>Babraham Institute</publisher-name>.</citation>
</ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aranaz</surname> <given-names>P.</given-names></name> <name><surname>Migu&#x000E9;liz</surname> <given-names>I.</given-names></name> <name><surname>Hurtado</surname> <given-names>C.</given-names></name> <name><surname>Erquiaga</surname> <given-names>I.</given-names></name> <name><surname>Larrayoz</surname> <given-names>M. J.</given-names></name> <name><surname>Calasanz</surname> <given-names>M. J.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>CBL RING finger deletions are common in core-binding factor acute myeloid leukemias</article-title>. <source>Leuk. Lymphoma</source> <volume>54</volume>, <fpage>428</fpage>&#x02013;<lpage>431</lpage>. <pub-id pub-id-type="doi">10.3109/10428194.2012.709629</pub-id><pub-id pub-id-type="pmid">22799433</pub-id></citation>
</ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Asch</surname> <given-names>H. L.</given-names></name> <name><surname>Eliacin</surname> <given-names>E.</given-names></name> <name><surname>Fanning</surname> <given-names>T. G.</given-names></name> <name><surname>Connolly</surname> <given-names>J. L.</given-names></name> <name><surname>Bratthauer</surname> <given-names>G.</given-names></name> <name><surname>Asch</surname> <given-names>B. B.</given-names></name></person-group> (<year>1996</year>). <article-title>Comparative expression of the LINE-1 p40 protein in human breast carcinomas and normal breast tissues</article-title>. <source>Oncol. Res.</source> <volume>8</volume>, <fpage>239</fpage>&#x02013;<lpage>247</lpage>. <pub-id pub-id-type="pmid">8895199</pub-id></citation>
</ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baillie</surname> <given-names>J. K.</given-names></name> <name><surname>Barnett</surname> <given-names>M. W.</given-names></name> <name><surname>Upton</surname> <given-names>K. R.</given-names></name> <name><surname>Gerhardt</surname> <given-names>D. J.</given-names></name> <name><surname>Richmond</surname> <given-names>T. A.</given-names></name> <name><surname>De Sapio</surname> <given-names>F.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Somatic retrotransposition alters the genetic landscape of the human brain</article-title>. <source>Nature</source> <volume>479</volume>, <fpage>534</fpage>&#x02013;<lpage>537</lpage>. <pub-id pub-id-type="doi">10.1038/nature10531</pub-id><pub-id pub-id-type="pmid">22037309</pub-id></citation>
</ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Batzer</surname> <given-names>M. A.</given-names></name> <name><surname>Deininger</surname> <given-names>P. L.</given-names></name></person-group> (<year>1991</year>). <article-title>A human-specific subfamily of Alu sequences</article-title>. <source>Genomics</source> <volume>9</volume>, <fpage>481</fpage>&#x02013;<lpage>487</lpage>. <pub-id pub-id-type="doi">10.1016/0888-7543(91)90414-A</pub-id><pub-id pub-id-type="pmid">1851725</pub-id></citation>
</ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Batzer</surname> <given-names>M. A.</given-names></name> <name><surname>Deininger</surname> <given-names>P. L.</given-names></name></person-group> (<year>2002</year>). <article-title>Alu repeats and human genomic diversity</article-title>. <source>Nat. Rev. Genet.</source> <volume>3</volume>, <fpage>370</fpage>&#x02013;<lpage>379</lpage>. <pub-id pub-id-type="doi">10.1038/nrg798</pub-id><pub-id pub-id-type="pmid">11988762</pub-id></citation>
</ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Batzer</surname> <given-names>M. A.</given-names></name> <name><surname>Gudi</surname> <given-names>V. A.</given-names></name> <name><surname>Mena</surname> <given-names>J. C.</given-names></name> <name><surname>Foltz</surname> <given-names>D. W.</given-names></name> <name><surname>Herrera</surname> <given-names>R. J.</given-names></name> <name><surname>Deininger</surname> <given-names>P. L.</given-names></name></person-group> (<year>1991</year>). <article-title>Amplification dynamics of human-specific (HS) Alu family members</article-title>. <source>Nucleic Acids Res.</source> <volume>19</volume>, <fpage>3619</fpage>&#x02013;<lpage>3623</lpage>. <pub-id pub-id-type="doi">10.1093/nar/19.13.3619</pub-id><pub-id pub-id-type="pmid">1649453</pub-id></citation>
</ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Belancio</surname> <given-names>V. P.</given-names></name> <name><surname>Roy-Engel</surname> <given-names>A. M.</given-names></name> <name><surname>Deininger</surname> <given-names>P. L.</given-names></name></person-group> (<year>2010a</year>). <article-title>All y&#x00027;all need to know &#x00027;bout retroelements in cancer</article-title>. <source>Semin. Cancer Biol.</source> <volume>20</volume>, <fpage>200</fpage>&#x02013;<lpage>210</lpage>. <pub-id pub-id-type="doi">10.1016/j.semcancer.2010.06.001</pub-id><pub-id pub-id-type="pmid">20600922</pub-id></citation>
</ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Belancio</surname> <given-names>V. P.</given-names></name> <name><surname>Roy-Engel</surname> <given-names>A. M.</given-names></name> <name><surname>Pochampally</surname> <given-names>R. R.</given-names></name> <name><surname>Deininger</surname> <given-names>P.</given-names></name></person-group> (<year>2010b</year>). <article-title>Somatic expression of LINE-1 elements in human tissues</article-title>. <source>Nucleic Acids Res.</source> <volume>38</volume>, <fpage>3909</fpage>&#x02013;<lpage>3922</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkq132</pub-id><pub-id pub-id-type="pmid">20215437</pub-id></citation>
</ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bratthauer</surname> <given-names>G. L.</given-names></name> <name><surname>Cardiff</surname> <given-names>R. D.</given-names></name> <name><surname>Fanning</surname> <given-names>T. G.</given-names></name></person-group> (<year>1994</year>). <article-title>Expression of LINE-1 retrotransposons in human breast cancer</article-title>. <source>Cancer</source> <volume>73</volume>, <fpage>2333</fpage>&#x02013;<lpage>2336</lpage>. <pub-id pub-id-type="pmid">8168038</pub-id></citation>
</ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bratthauer</surname> <given-names>G. L.</given-names></name> <name><surname>Fanning</surname> <given-names>T. G.</given-names></name></person-group> (<year>1992</year>). <article-title>Active LINE-1 retrotransposons in human testicular cancer</article-title>. <source>Oncogene</source> <volume>7</volume>, <fpage>507</fpage>&#x02013;<lpage>510</lpage>. <pub-id pub-id-type="pmid">1312702</pub-id></citation>
</ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bratthauer</surname> <given-names>G. L.</given-names></name> <name><surname>Fanning</surname> <given-names>T. G.</given-names></name></person-group> (<year>1993</year>). <article-title>LINE-1 retrotransposon expression in pediatric germ cell tumors</article-title>. <source>Cancer</source> <volume>71</volume>, <fpage>2383</fpage>&#x02013;<lpage>2386</lpage>. <pub-id pub-id-type="pmid">8384068</pub-id></citation>
</ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Brouha</surname> <given-names>B.</given-names></name> <name><surname>Schustak</surname> <given-names>J.</given-names></name> <name><surname>Badge</surname> <given-names>R. M.</given-names></name> <name><surname>Lutz-Prigge</surname> <given-names>S.</given-names></name> <name><surname>Farley</surname> <given-names>A. H.</given-names></name> <name><surname>Moran</surname> <given-names>J. V.</given-names></name> <etal/></person-group>. (<year>2003</year>). <article-title>Hot L1s account for the bulk of retrotransposition in the human population</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>100</volume>, <fpage>5280</fpage>&#x02013;<lpage>5285</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0831042100</pub-id><pub-id pub-id-type="pmid">12682288</pub-id></citation>
</ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carreira</surname> <given-names>P. E.</given-names></name> <name><surname>Richardson</surname> <given-names>S. R.</given-names></name> <name><surname>Faulkner</surname> <given-names>G. J.</given-names></name></person-group> (<year>2014</year>). <article-title>L1 retrotransposons, cancer stem cells and oncogenesis</article-title>. <source>FEBS J.</source> <volume>281</volume>, <fpage>63</fpage>&#x02013;<lpage>73</lpage>. <pub-id pub-id-type="doi">10.1111/febs.12601</pub-id><pub-id pub-id-type="pmid">24286172</pub-id></citation>
</ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Criscione</surname> <given-names>S. W.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Thompson</surname> <given-names>W.</given-names></name> <name><surname>Sedivy</surname> <given-names>J. M.</given-names></name> <name><surname>Neretti</surname> <given-names>N.</given-names></name></person-group> (<year>2014</year>). <article-title>Transcriptional landscape of repetitive elements in normal and cancer human cells</article-title>. <source>BMC Genomics</source> <volume>15</volume>:<fpage>583</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-15-583</pub-id><pub-id pub-id-type="pmid">25012247</pub-id></citation>
</ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Damiani</surname> <given-names>D.</given-names></name> <name><surname>Tiribelli</surname> <given-names>M.</given-names></name> <name><surname>Franzoni</surname> <given-names>A.</given-names></name> <name><surname>Michelutti</surname> <given-names>A.</given-names></name> <name><surname>Fabbro</surname> <given-names>D.</given-names></name> <name><surname>Cavallin</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>BAALC overexpression retains its negative prognostic role across all cytogenetic risk groups in acute myeloid leukemia patients</article-title>. <source>Am. J. Hematol.</source> <volume>88</volume>, <fpage>848</fpage>&#x02013;<lpage>852</lpage>. <pub-id pub-id-type="doi">10.1002/ajh.23516</pub-id><pub-id pub-id-type="pmid">23760853</pub-id></citation>
</ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Deininger</surname> <given-names>P.</given-names></name></person-group> (<year>2011</year>). <article-title>Alu elements: know the SINEs</article-title>. <source>Genome Biol.</source> <volume>12</volume>:<fpage>236</fpage>. <pub-id pub-id-type="doi">10.1186/gb-2011-12-12-236</pub-id><pub-id pub-id-type="pmid">22204421</pub-id></citation>
</ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>de Koning</surname> <given-names>A. P.</given-names></name> <name><surname>Gu</surname> <given-names>W.</given-names></name> <name><surname>Castoe</surname> <given-names>T. A.</given-names></name> <name><surname>Batzer</surname> <given-names>M. A.</given-names></name> <name><surname>Pollock</surname> <given-names>D. D.</given-names></name></person-group> (<year>2011</year>). <article-title>Repetitive elements may comprise over two-thirds of the human genome</article-title>. <source>PLoS Genet.</source> <volume>7</volume>:<fpage>e1002384</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1002384</pub-id><pub-id pub-id-type="pmid">22144907</pub-id></citation>
</ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Doucet-O&#x00027;Hare</surname> <given-names>T. T.</given-names></name> <name><surname>Rodic</surname> <given-names>N.</given-names></name> <name><surname>Sharma</surname> <given-names>R.</given-names></name> <name><surname>Darbari</surname> <given-names>I.</given-names></name> <name><surname>Abril</surname> <given-names>G.</given-names></name> <name><surname>Choi</surname> <given-names>J. A.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>LINE-1 expression and retrotransposition in Barrett&#x00027;s esophagus and esophageal carcinoma</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>112</volume>, <fpage>E4894</fpage>&#x02013;<lpage>E4900</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1502474112</pub-id><pub-id pub-id-type="pmid">26283398</pub-id></citation>
</ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Doucet-O&#x00027;Hare</surname> <given-names>T. T.</given-names></name> <name><surname>Sharma</surname> <given-names>R.</given-names></name> <name><surname>Rodic</surname> <given-names>N.</given-names></name> <name><surname>Anders</surname> <given-names>R. A.</given-names></name> <name><surname>Burns</surname> <given-names>K. H.</given-names></name> <name><surname>Kazazian</surname> <given-names>H. H.</given-names> <suffix>Jr.</suffix></name></person-group> (<year>2016</year>). <article-title>Somatically Acquired LINE-1 Insertions in Normal Esophagus Undergo Clonal Expansion in Esophageal Squamous Cell Carcinoma</article-title>. <source>Hum. Mutat.</source> <volume>37</volume>, <fpage>942</fpage>&#x02013;<lpage>954</lpage>. <pub-id pub-id-type="doi">10.1002/humu.23027</pub-id><pub-id pub-id-type="pmid">27319353</pub-id></citation>
</ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ewing</surname> <given-names>A. D.</given-names></name></person-group> (<year>2015</year>). <article-title>Transposable element detection from whole genome sequence data</article-title>. <source>Mob. DNA</source> <volume>6</volume>:<fpage>24</fpage>. <pub-id pub-id-type="doi">10.1186/s13100-015-0055-3</pub-id><pub-id pub-id-type="pmid">26719777</pub-id></citation>
</ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ewing</surname> <given-names>A. D.</given-names></name> <name><surname>Gacita</surname> <given-names>A.</given-names></name> <name><surname>Wood</surname> <given-names>L. D.</given-names></name> <name><surname>Ma</surname> <given-names>F.</given-names></name> <name><surname>Xing</surname> <given-names>D.</given-names></name> <name><surname>Kim</surname> <given-names>M. S.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Widespread somatic L1 retrotransposition occurs early during gastrointestinal cancer evolution</article-title>. <source>Genome Res.</source> <volume>25</volume>, <fpage>1536</fpage>&#x02013;<lpage>1545</lpage>. <pub-id pub-id-type="doi">10.1101/gr.196238.115</pub-id><pub-id pub-id-type="pmid">26260970</pub-id></citation>
</ref>
<ref id="B25">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Forbes</surname> <given-names>S. A.</given-names></name> <name><surname>Beare</surname> <given-names>D.</given-names></name> <name><surname>Gunasekaran</surname> <given-names>P.</given-names></name> <name><surname>Leung</surname> <given-names>K.</given-names></name> <name><surname>Bindal</surname> <given-names>N.</given-names></name> <name><surname>Boutselakis</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>COSMIC: exploring the world&#x00027;s knowledge of somatic mutations in human cancer</article-title>. <source>Nucleic Acids Res.</source> <volume>43</volume>(<issue>Database issue</issue>), <fpage>D805</fpage>&#x02013;<lpage>D811</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gku1075</pub-id><pub-id pub-id-type="pmid">25355519</pub-id></citation>
</ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Han</surname> <given-names>J. S.</given-names></name> <name><surname>Szak</surname> <given-names>S. T.</given-names></name> <name><surname>Boeke</surname> <given-names>J. D.</given-names></name></person-group> (<year>2004</year>). <article-title>Transcriptional disruption by the L1 retrotransposon and implications for mammalian transcriptomes</article-title>. <source>Nature</source> <volume>429</volume>, <fpage>268</fpage>&#x02013;<lpage>274</lpage>. <pub-id pub-id-type="doi">10.1038/nature02536</pub-id><pub-id pub-id-type="pmid">15152245</pub-id></citation>
</ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hancks</surname> <given-names>D. C.</given-names></name> <name><surname>Kazazian</surname> <given-names>H. H.</given-names> <suffix>Jr.</suffix></name></person-group> (<year>2010</year>). <article-title>SVA retrotransposons: evolution and genetic instability</article-title>. <source>Semin. Cancer Biol.</source> <volume>20</volume>, <fpage>234</fpage>&#x02013;<lpage>245</lpage>. <pub-id pub-id-type="doi">10.1016/j.semcancer.2010.04.001</pub-id><pub-id pub-id-type="pmid">20416380</pub-id></citation>
</ref>
<ref id="B28">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hancks</surname> <given-names>D. C.</given-names></name> <name><surname>Kazazian</surname> <given-names>H. H.</given-names> <suffix>Jr.</suffix></name></person-group> (<year>2012</year>). <article-title>Active human retrotransposons: variation and disease</article-title>. <source>Curr. Opin. Genet. Dev.</source> <volume>22</volume>, <fpage>191</fpage>&#x02013;<lpage>203</lpage>. <pub-id pub-id-type="doi">10.1016/j.gde.2012.02.006</pub-id><pub-id pub-id-type="pmid">22406018</pub-id></citation>
</ref>
<ref id="B29">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Harris</surname> <given-names>C. R.</given-names></name> <name><surname>Normart</surname> <given-names>R.</given-names></name> <name><surname>Yang</surname> <given-names>Q.</given-names></name> <name><surname>Stevenson</surname> <given-names>E.</given-names></name> <name><surname>Haffty</surname> <given-names>B. G.</given-names></name> <name><surname>Ganesan</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Association of nuclear localization of a long interspersed nuclear element-1 protein in breast tumors with poor prognostic outcomes</article-title>. <source>Genes Cancer</source> <volume>1</volume>, <fpage>115</fpage>&#x02013;<lpage>124</lpage>. <pub-id pub-id-type="doi">10.1177/1947601909360812</pub-id><pub-id pub-id-type="pmid">20948976</pub-id></citation>
</ref>
<ref id="B30">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Helman</surname> <given-names>E.</given-names></name> <name><surname>Lawrence</surname> <given-names>M. S.</given-names></name> <name><surname>Stewart</surname> <given-names>C.</given-names></name> <name><surname>Sougnez</surname> <given-names>C.</given-names></name> <name><surname>Getz</surname> <given-names>G.</given-names></name> <name><surname>Meyerson</surname> <given-names>M.</given-names></name></person-group> (<year>2014</year>). <article-title>Somatic retrotransposition in human cancer revealed by whole-genome and exome sequencing</article-title>. <source>Genome Res.</source> <volume>24</volume>, <fpage>1053</fpage>&#x02013;<lpage>1063</lpage>. <pub-id pub-id-type="doi">10.1101/gr.163659.113</pub-id><pub-id pub-id-type="pmid">24823667</pub-id></citation>
</ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iskow</surname> <given-names>R. C.</given-names></name> <name><surname>McCabe</surname> <given-names>M. T.</given-names></name> <name><surname>Mills</surname> <given-names>R. E.</given-names></name> <name><surname>Torene</surname> <given-names>S.</given-names></name> <name><surname>Pittard</surname> <given-names>W. S.</given-names></name> <name><surname>Neuwald</surname> <given-names>A. F.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Natural mutagenesis of human genomes by endogenous retrotransposons</article-title>. <source>Cell</source> <volume>141</volume>, <fpage>1253</fpage>&#x02013;<lpage>1261</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2010.05.020</pub-id><pub-id pub-id-type="pmid">20603005</pub-id></citation>
</ref>
<ref id="B32">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jin</surname> <given-names>Y.</given-names></name> <name><surname>Tam</surname> <given-names>O. H.</given-names></name> <name><surname>Paniagua</surname> <given-names>E.</given-names></name> <name><surname>Hammell</surname> <given-names>M.</given-names></name></person-group> (<year>2015</year>). <article-title>TEtranscripts: a package for including transposable elements in differential expression analysis of RNA-seq datasets</article-title>. <source>Bioinformatics</source> <volume>31</volume>, <fpage>3593</fpage>&#x02013;<lpage>3599</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv422</pub-id><pub-id pub-id-type="pmid">26206304</pub-id></citation>
</ref>
<ref id="B33">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kazazian</surname> <given-names>H. H.</given-names> <suffix>Jr.</suffix></name> <name><surname>Wong</surname> <given-names>C.</given-names></name> <name><surname>Youssoufian</surname> <given-names>H.</given-names></name> <name><surname>Scott</surname> <given-names>A. F.</given-names></name> <name><surname>Phillips</surname> <given-names>D. G.</given-names></name> <name><surname>Antonarakis</surname> <given-names>S. E.</given-names></name></person-group> (<year>1988</year>). <article-title>Haemophilia A resulting from de novo insertion of L1 sequences represents a novel mechanism for mutation in man</article-title>. <source>Nature</source> <volume>332</volume>, <fpage>164</fpage>&#x02013;<lpage>166</lpage>. <pub-id pub-id-type="doi">10.1038/332164a0</pub-id><pub-id pub-id-type="pmid">2831458</pub-id></citation>
</ref>
<ref id="B34">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kemp</surname> <given-names>J. R.</given-names></name> <name><surname>Longworth</surname> <given-names>M. S.</given-names></name></person-group> (<year>2015</year>). <article-title>Crossing the LINE Toward Genomic Instability: LINE-1 Retrotransposition in Cancer</article-title>. <source>Front. Chem.</source> <volume>3</volume>:<fpage>68</fpage>. <pub-id pub-id-type="doi">10.3389/fchem.2015.00068</pub-id><pub-id pub-id-type="pmid">26734601</pub-id></citation>
</ref>
<ref id="B35">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lander</surname> <given-names>E. S.</given-names></name> <name><surname>Linton</surname> <given-names>L. M.</given-names></name> <name><surname>Birren</surname> <given-names>B.</given-names></name> <name><surname>Nusbaum</surname> <given-names>C.</given-names></name> <name><surname>Zody</surname> <given-names>M. C.</given-names></name> <name><surname>Baldwin</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2001</year>). <article-title>Initial sequencing and analysis of the human genome</article-title>. <source>Nature</source> <volume>409</volume>, <fpage>860</fpage>&#x02013;<lpage>921</lpage>. <pub-id pub-id-type="doi">10.1038/35057062</pub-id><pub-id pub-id-type="pmid">11237011</pub-id></citation>
</ref>
<ref id="B36">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>E.</given-names></name> <name><surname>Iskow</surname> <given-names>R.</given-names></name> <name><surname>Yang</surname> <given-names>L.</given-names></name> <name><surname>Gokcumen</surname> <given-names>O.</given-names></name> <name><surname>Haseley</surname> <given-names>P.</given-names></name> <name><surname>Luquette</surname> <given-names>L. J.</given-names> <suffix>III</suffix></name> <etal/></person-group>. (<year>2012</year>). <article-title>Landscape of somatic retrotransposition in human cancers</article-title>. <source>Science</source> <volume>337</volume>, <fpage>967</fpage>&#x02013;<lpage>971</lpage>. <pub-id pub-id-type="doi">10.1126/science.1222077</pub-id><pub-id pub-id-type="pmid">22745252</pub-id></citation>
</ref>
<ref id="B37">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Handsaker</surname> <given-names>B.</given-names></name> <name><surname>Wysoker</surname> <given-names>A.</given-names></name> <name><surname>Fennell</surname> <given-names>T.</given-names></name> <name><surname>Ruan</surname> <given-names>J.</given-names></name> <name><surname>Homer</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>The Sequence Alignment/Map format and SAMtools</article-title>. <source>Bioinformatics</source> <volume>25</volume>, <fpage>2078</fpage>&#x02013;<lpage>2079</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp352</pub-id><pub-id pub-id-type="pmid">19505943</pub-id></citation>
</ref>
<ref id="B38">
<citation citation-type="other"><person-group person-group-type="author"><name><surname>Maltbie</surname> <given-names>D.</given-names></name> <name><surname>Ganeshalingam</surname> <given-names>L.</given-names></name> <name><surname>Allen</surname> <given-names>P.</given-names></name></person-group> (<year>2013</year>). <source>System and Method for Secure, High-Speed Transfer of Very Large Files</source>. Google Patents.</citation>
</ref>
<ref id="B39">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martinelli</surname> <given-names>S.</given-names></name> <name><surname>De Luca</surname> <given-names>A.</given-names></name> <name><surname>Stellacci</surname> <given-names>E.</given-names></name> <name><surname>Rossi</surname> <given-names>C.</given-names></name> <name><surname>Checquolo</surname> <given-names>S.</given-names></name> <name><surname>Lepri</surname> <given-names>F.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Heterozygous germline mutations in the CBL tumor-suppressor gene cause a Noonan syndrome-like phenotype</article-title>. <source>Am. J. Hum. Genet.</source> <volume>87</volume>, <fpage>250</fpage>&#x02013;<lpage>257</lpage>. <pub-id pub-id-type="doi">10.1016/j.ajhg.2010.06.015</pub-id><pub-id pub-id-type="pmid">20619386</pub-id></citation>
</ref>
<ref id="B40">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Marx</surname> <given-names>V.</given-names></name></person-group> (<year>2014</year>). <article-title>Cancer genomes: discerning drivers from passengers</article-title>. <source>Nat. Methods</source> <volume>11</volume>, <fpage>375</fpage>&#x02013;<lpage>379</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.2891</pub-id></citation>
</ref>
<ref id="B41">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Miki</surname> <given-names>Y.</given-names></name> <name><surname>Nishisho</surname> <given-names>I.</given-names></name> <name><surname>Horii</surname> <given-names>A.</given-names></name> <name><surname>Miyoshi</surname> <given-names>Y.</given-names></name> <name><surname>Utsunomiya</surname> <given-names>J.</given-names></name> <name><surname>Kinzler</surname> <given-names>K. W.</given-names></name> <etal/></person-group>. (<year>1992</year>). <article-title>Disruption of the APC gene by a retrotransposal insertion of L1 sequence in a colon cancer</article-title>. <source>Cancer Res.</source> <volume>52</volume>, <fpage>643</fpage>&#x02013;<lpage>645</lpage>. <pub-id pub-id-type="pmid">1310068</pub-id></citation>
</ref>
<ref id="B42">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mills</surname> <given-names>R. E.</given-names></name> <name><surname>Bennett</surname> <given-names>E. A.</given-names></name> <name><surname>Iskow</surname> <given-names>R. C.</given-names></name> <name><surname>Devine</surname> <given-names>S. E.</given-names></name></person-group> (<year>2007</year>). <article-title>Which transposable elements are active in the human genome?</article-title> <source>Trends Genet.</source> <volume>23</volume>, <fpage>183</fpage>&#x02013;<lpage>191</lpage>. <pub-id pub-id-type="doi">10.1016/j.tig.2007.02.006</pub-id><pub-id pub-id-type="pmid">17331616</pub-id></citation>
</ref>
<ref id="B43">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morita</surname> <given-names>K.</given-names></name> <name><surname>Masamoto</surname> <given-names>Y.</given-names></name> <name><surname>Kataoka</surname> <given-names>K.</given-names></name> <name><surname>Koya</surname> <given-names>J.</given-names></name> <name><surname>Kagoya</surname> <given-names>Y.</given-names></name> <name><surname>Yashiroda</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>BAALC potentiates oncogenic ERK pathway through interactions with MEKK1 and KLF4</article-title>. <source>Leukemia</source> <volume>29</volume>, <fpage>2248</fpage>&#x02013;<lpage>2256</lpage>. <pub-id pub-id-type="doi">10.1038/leu.2015.137</pub-id><pub-id pub-id-type="pmid">26050649</pub-id></citation>
</ref>
<ref id="B44">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morse</surname> <given-names>B.</given-names></name> <name><surname>Rothberg</surname> <given-names>P. G.</given-names></name> <name><surname>South</surname> <given-names>V. J.</given-names></name> <name><surname>Spandorfer</surname> <given-names>J. M.</given-names></name> <name><surname>Astrin</surname> <given-names>S. M.</given-names></name></person-group> (<year>1988</year>). <article-title>Insertional mutagenesis of the myc locus by a LINE-1 sequence in a human breast carcinoma</article-title>. <source>Nature</source> <volume>333</volume>, <fpage>87</fpage>&#x02013;<lpage>90</lpage>. <pub-id pub-id-type="doi">10.1038/333087a0</pub-id><pub-id pub-id-type="pmid">2834650</pub-id></citation>
</ref>
<ref id="B45">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Naramura</surname> <given-names>M.</given-names></name> <name><surname>Nadeau</surname> <given-names>S.</given-names></name> <name><surname>Mohapatra</surname> <given-names>B.</given-names></name> <name><surname>Ahmad</surname> <given-names>G.</given-names></name> <name><surname>Mukhopadhyay</surname> <given-names>C.</given-names></name> <name><surname>Sattler</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Mutant Cbl proteins as oncogenic drivers in myeloproliferative disorders</article-title>. <source>Oncotarget</source> <volume>2</volume>, <fpage>245</fpage>&#x02013;<lpage>250</lpage>. <pub-id pub-id-type="doi">10.18632/oncotarget.233</pub-id><pub-id pub-id-type="pmid">21422499</pub-id></citation>
</ref>
<ref id="B46">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ostertag</surname> <given-names>E. M.</given-names></name> <name><surname>Goodier</surname> <given-names>J. L.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Kazazian</surname> <given-names>H. H.</given-names> <suffix>Jr.</suffix></name></person-group> (<year>2003</year>). <article-title>SVA elements are nonautonomous retrotransposons that cause disease in humans</article-title>. <source>Am. J. Hum. Genet.</source> <volume>73</volume>, <fpage>1444</fpage>&#x02013;<lpage>1451</lpage>. <pub-id pub-id-type="doi">10.1086/380207</pub-id><pub-id pub-id-type="pmid">14628287</pub-id></citation>
</ref>
<ref id="B47">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Penzkofer</surname> <given-names>T.</given-names></name> <name><surname>Dandekar</surname> <given-names>T.</given-names></name> <name><surname>Zemojtel</surname> <given-names>T.</given-names></name></person-group> (<year>2005</year>). <article-title>L1Base: from functional annotation to prediction of active LINE-1 elements</article-title>. <source>Nucleic Acids Res.</source> <volume>33</volume>(<issue>Database issue</issue>), <fpage>D498</fpage>&#x02013;<lpage>D500</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gki044</pub-id><pub-id pub-id-type="pmid">15608246</pub-id></citation>
</ref>
<ref id="B48">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pon</surname> <given-names>J. R.</given-names></name> <name><surname>Marra</surname> <given-names>M. A.</given-names></name></person-group> (<year>2015</year>). <article-title>Driver and passenger mutations in cancer</article-title>. <source>Annu. Rev. Pathol.</source> <volume>10</volume>, <fpage>25</fpage>&#x02013;<lpage>50</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-pathol-012414-040312</pub-id><pub-id pub-id-type="pmid">25340638</pub-id></citation>
</ref>
<ref id="B49">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pruitt</surname> <given-names>K. D.</given-names></name> <name><surname>Tatusova</surname> <given-names>T.</given-names></name> <name><surname>Brown</surname> <given-names>G. R.</given-names></name> <name><surname>Maglott</surname> <given-names>D. R.</given-names></name></person-group> (<year>2012</year>). <article-title>NCBI Reference Sequences (RefSeq): current status, new features and genome annotation policy</article-title>. <source>Nucleic Acids Res.</source> <volume>40</volume>(<issue>Database issue</issue>), <fpage>D130</fpage>&#x02013;<lpage>D135</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkr1079</pub-id><pub-id pub-id-type="pmid">22121212</pub-id></citation>
</ref>
<ref id="B50">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Quinlan</surname> <given-names>A. R.</given-names></name></person-group> (<year>2014</year>). <article-title>BEDTools: the Swiss-Army Tool for Genome Feature Analysis</article-title>. <source>Curr. Protoc. Bioinformatics</source> <volume>47</volume>, <fpage>11.12.1</fpage>&#x02013;<lpage>11.12.34</lpage>. <pub-id pub-id-type="doi">10.1002/0471250953.bi1112s47</pub-id><pub-id pub-id-type="pmid">25199790</pub-id></citation>
</ref>
<ref id="B51">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rangasamy</surname> <given-names>D.</given-names></name> <name><surname>Lenka</surname> <given-names>N.</given-names></name> <name><surname>Ohms</surname> <given-names>S.</given-names></name> <name><surname>Dahlstrom</surname> <given-names>J. E.</given-names></name> <name><surname>Blackburn</surname> <given-names>A. C.</given-names></name> <name><surname>Board</surname> <given-names>P. G.</given-names></name></person-group> (<year>2015</year>). <article-title>Activation of LINE-1 Retrotransposon Increases the Risk of Epithelial-Mesenchymal Transition and Metastasis in Epithelial Cancer</article-title>. <source>Curr. Mol. Med.</source> <volume>15</volume>, <fpage>588</fpage>&#x02013;<lpage>597</lpage>. <pub-id pub-id-type="doi">10.2174/1566524015666150831130827</pub-id><pub-id pub-id-type="pmid">26321759</pub-id></citation>
</ref>
<ref id="B52">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rishishwar</surname> <given-names>L.</given-names></name> <name><surname>Marino-Ramirez</surname> <given-names>L.</given-names></name> <name><surname>Jordan</surname> <given-names>I. K.</given-names></name></person-group> (<year>2016</year>). <article-title>Benchmarking computational tools for polymorphic transposable element detection</article-title>. <source>Brief. Bioinform.</source> [Epub ahead of print]. <pub-id pub-id-type="doi">10.1093/bib/bbw072</pub-id><pub-id pub-id-type="pmid">27524380</pub-id></citation>
</ref>
<ref id="B53">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rishishwar</surname> <given-names>L.</given-names></name> <name><surname>Tellez Villa</surname> <given-names>C. E.</given-names></name> <name><surname>Jordan</surname> <given-names>I. K.</given-names></name></person-group> (<year>2015</year>). <article-title>Transposable element polymorphisms recapitulate human evolution</article-title>. <source>Mob. DNA</source> <volume>6</volume>, <fpage>21</fpage>. <pub-id pub-id-type="doi">10.1186/s13100-015-0052-6</pub-id><pub-id pub-id-type="pmid">26579215</pub-id></citation>
</ref>
<ref id="B54">
<citation citation-type="journal"><person-group person-group-type="author"><collab>Roadmap Epigenomics Consortium</collab> <name><surname>Kundaje</surname> <given-names>A.</given-names></name> <name><surname>Meuleman</surname> <given-names>W.</given-names></name> <name><surname>Ernst</surname> <given-names>J.</given-names></name> <name><surname>Bilenky</surname> <given-names>M.</given-names></name> <name><surname>Yen</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Integrative analysis of 111 reference human epigenomes</article-title>. <source>Nature</source> <volume>518</volume>, <fpage>317</fpage>&#x02013;<lpage>330</lpage>. <pub-id pub-id-type="doi">10.1038/nature14248</pub-id><pub-id pub-id-type="pmid">25693563</pub-id></citation>
</ref>
<ref id="B55">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rodic</surname> <given-names>N.</given-names></name> <name><surname>Sharma</surname> <given-names>R.</given-names></name> <name><surname>Sharma</surname> <given-names>R.</given-names></name> <name><surname>Zampella</surname> <given-names>J.</given-names></name> <name><surname>Dai</surname> <given-names>L.</given-names></name> <name><surname>Taylor</surname> <given-names>M. S.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Long interspersed element-1 protein expression is a hallmark of many human cancers</article-title>. <source>Am. J. Pathol.</source> <volume>184</volume>, <fpage>1280</fpage>&#x02013;<lpage>1286</lpage>. <pub-id pub-id-type="doi">10.1016/j.ajpath.2014.01.007</pub-id><pub-id pub-id-type="pmid">24607009</pub-id></citation>
</ref>
<ref id="B56">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schmidt</surname> <given-names>M. H.</given-names></name> <name><surname>Dikic</surname> <given-names>I.</given-names></name></person-group> (<year>2005</year>). <article-title>The Cbl interactome and its functions</article-title>. <source>Nat. Rev. Mol. Cell Biol.</source> <volume>6</volume>, <fpage>907</fpage>&#x02013;<lpage>918</lpage>. <pub-id pub-id-type="doi">10.1038/nrm1762</pub-id><pub-id pub-id-type="pmid">16227975</pub-id></citation>
</ref>
<ref id="B57">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Scott</surname> <given-names>E. C.</given-names></name> <name><surname>Gardner</surname> <given-names>E. J.</given-names></name> <name><surname>Masood</surname> <given-names>A.</given-names></name> <name><surname>Chuang</surname> <given-names>N. T.</given-names></name> <name><surname>Vertino</surname> <given-names>P. M.</given-names></name> <name><surname>Devine</surname> <given-names>S. E.</given-names></name></person-group> (<year>2016</year>). <article-title>A hot L1 retrotransposon evades somatic repression and initiates human colorectal cancer</article-title>. <source>Genome Res.</source> <volume>26</volume>, <fpage>745</fpage>&#x02013;<lpage>755</lpage>. <pub-id pub-id-type="doi">10.1101/gr.201814.115</pub-id><pub-id pub-id-type="pmid">27197217</pub-id></citation>
</ref>
<ref id="B58">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sever</surname> <given-names>R.</given-names></name> <name><surname>Brugge</surname> <given-names>J. S.</given-names></name></person-group> (<year>2015</year>). <article-title>Signal transduction in cancer</article-title>. <source>Cold Spring Harb. Perspect. Med.</source> <volume>5</volume>:<fpage>a006098</fpage>. <pub-id pub-id-type="doi">10.1101/cshperspect.a006098</pub-id><pub-id pub-id-type="pmid">25833940</pub-id></citation>
</ref>
<ref id="B59">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shukla</surname> <given-names>R.</given-names></name> <name><surname>Upton</surname> <given-names>K. R.</given-names></name> <name><surname>Mu&#x000F1;oz-Lopez</surname> <given-names>M.</given-names></name> <name><surname>Gerhardt</surname> <given-names>D. J.</given-names></name> <name><surname>Fisher</surname> <given-names>M. E.</given-names></name> <name><surname>Nguyen</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Endogenous retrotransposition activates oncogenic pathways in hepatocellular carcinoma</article-title>. <source>Cell</source> <volume>153</volume>, <fpage>101</fpage>&#x02013;<lpage>111</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2013.02.032</pub-id><pub-id pub-id-type="pmid">23540693</pub-id></citation>
</ref>
<ref id="B60">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Solyom</surname> <given-names>S.</given-names></name> <name><surname>Ewing</surname> <given-names>A. D.</given-names></name> <name><surname>Rahrmann</surname> <given-names>E. P.</given-names></name> <name><surname>Doucet</surname> <given-names>T.</given-names></name> <name><surname>Nelson</surname> <given-names>H. H.</given-names></name> <name><surname>Burns</surname> <given-names>M. B.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>Extensive somatic L1 retrotransposition in colorectal tumors</article-title>. <source>Genome Res.</source> <volume>22</volume>, <fpage>2328</fpage>&#x02013;<lpage>2338</lpage>. <pub-id pub-id-type="doi">10.1101/gr.145235.112</pub-id><pub-id pub-id-type="pmid">22968929</pub-id></citation>
</ref>
<ref id="B61">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Solyom</surname> <given-names>S.</given-names></name> <name><surname>Kazazian</surname> <given-names>H. H.</given-names> <suffix>Jr.</suffix></name></person-group> (<year>2012</year>). <article-title>Mobile elements in the human genome: implications for disease</article-title>. <source>Genome Med.</source> <volume>4</volume>:<fpage>12</fpage>. <pub-id pub-id-type="doi">10.1186/gm311</pub-id><pub-id pub-id-type="pmid">22364178</pub-id></citation>
</ref>
<ref id="B62">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stratton</surname> <given-names>M. R.</given-names></name> <name><surname>Campbell</surname> <given-names>P. J.</given-names></name> <name><surname>Futreal</surname> <given-names>P. A.</given-names></name></person-group> (<year>2009</year>). <article-title>The cancer genome</article-title>. <source>Nature</source> <volume>458</volume>, <fpage>719</fpage>&#x02013;<lpage>724</lpage>. <pub-id pub-id-type="doi">10.1038/nature07943</pub-id><pub-id pub-id-type="pmid">19360079</pub-id></citation>
</ref>
<ref id="B63">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sudmant</surname> <given-names>P. H.</given-names></name> <name><surname>Rausch</surname> <given-names>T.</given-names></name> <name><surname>Gardner</surname> <given-names>E. J.</given-names></name> <name><surname>Handsaker</surname> <given-names>R. E.</given-names></name> <name><surname>Abyzov</surname> <given-names>A.</given-names></name> <name><surname>Huddleston</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>An integrated map of structural variation in 2,504 human genomes</article-title>. <source>Nature</source> <volume>526</volume>, <fpage>75</fpage>&#x02013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1038/nature15394</pub-id><pub-id pub-id-type="pmid">26432246</pub-id></citation>
</ref>
<ref id="B64">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thung</surname> <given-names>D. T.</given-names></name> <name><surname>de Ligt</surname> <given-names>J.</given-names></name> <name><surname>Vissers</surname> <given-names>L. E.</given-names></name> <name><surname>Steehouwer</surname> <given-names>M.</given-names></name> <name><surname>Kroon</surname> <given-names>M.</given-names></name> <name><surname>de Vries</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Mobster: accurate detection of mobile element insertions in next generation sequencing data</article-title>. <source>Genome Biol.</source> <volume>15</volume>:<fpage>488</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-014-0488-x</pub-id><pub-id pub-id-type="pmid">25348035</pub-id></citation>
</ref>
<ref id="B65">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Trapnell</surname> <given-names>C.</given-names></name> <name><surname>Williams</surname> <given-names>B. A.</given-names></name> <name><surname>Pertea</surname> <given-names>G.</given-names></name> <name><surname>Mortazavi</surname> <given-names>A.</given-names></name> <name><surname>Kwan</surname> <given-names>G.</given-names></name> <name><surname>van Baren</surname> <given-names>M. J.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Transcript assembly and quantification by RNA-Seq reveals unannotated transcripts and isoform switching during cell differentiation</article-title>. <source>Nat. Biotechnol.</source> <volume>28</volume>, <fpage>511</fpage>&#x02013;<lpage>515</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1621</pub-id><pub-id pub-id-type="pmid">20436464</pub-id></citation>
</ref>
<ref id="B66">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tubio</surname> <given-names>J. M.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Ju</surname> <given-names>Y. S.</given-names></name> <name><surname>Martincorena</surname> <given-names>I.</given-names></name> <name><surname>Cooke</surname> <given-names>S. L.</given-names></name> <name><surname>Tojo</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Mobile DNA in cancer. Extensive transduction of nonrepetitive DNA mediated by L1 retrotransposition in cancer genomes</article-title>. <source>Science</source> <volume>345</volume>:<fpage>1251343</fpage>. <pub-id pub-id-type="doi">10.1126/science.1251343</pub-id><pub-id pub-id-type="pmid">25082706</pub-id></citation>
</ref>
<ref id="B67">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van der Auwera</surname> <given-names>G. A.</given-names></name> <name><surname>Carneiro</surname> <given-names>M. O.</given-names></name> <name><surname>Hartl</surname> <given-names>C.</given-names></name> <name><surname>Poplin</surname> <given-names>R.</given-names></name> <name><surname>Del Angel</surname> <given-names>G.</given-names></name> <name><surname>Levy-Moonshine</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>From FastQ data to high confidence variant calls: the Genome Analysis Toolkit best practices pipeline</article-title>. <source>Curr. Protoc. Bioinformatics</source> <volume>43</volume>, <fpage>11.10.1</fpage>&#x02013;<lpage>11.10.33</lpage>. <pub-id pub-id-type="doi">10.1002/0471250953.bi1110s43</pub-id><pub-id pub-id-type="pmid">25431634</pub-id></citation>
</ref>
<ref id="B68">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>H.</given-names></name> <name><surname>Xing</surname> <given-names>J.</given-names></name> <name><surname>Grover</surname> <given-names>D.</given-names></name> <name><surname>Hedges</surname> <given-names>D. J.</given-names></name> <name><surname>Han</surname> <given-names>K.</given-names></name> <name><surname>Walker</surname> <given-names>J. A.</given-names></name> <etal/></person-group>. (<year>2005</year>). <article-title>SVA elements: a hominid-specific retroposon family</article-title>. <source>J. Mol. Biol.</source> <volume>354</volume>, <fpage>994</fpage>&#x02013;<lpage>1007</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmb.2005.09.085</pub-id><pub-id pub-id-type="pmid">16288912</pub-id></citation>
</ref>
<ref id="B69">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Weinstein</surname> <given-names>J. N.</given-names></name> <name><surname>Collisson</surname> <given-names>E. A.</given-names></name> <name><surname>Mills</surname> <given-names>G. B.</given-names></name> <name><surname>Shaw</surname> <given-names>K. M.</given-names></name> <name><surname>Ozenberger</surname> <given-names>B. A.</given-names></name> <name><surname>Ellrott</surname> <given-names>K.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>The Cancer Genome Atlas Pan-Cancer analysis project</article-title>. <source>Nat. Genet.</source> <volume>45</volume>, <fpage>1113</fpage>&#x02013;<lpage>1120</lpage>. <pub-id pub-id-type="doi">10.1038/ng.2764</pub-id><pub-id pub-id-type="pmid">24071849</pub-id></citation>
</ref>
<ref id="B70">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wildschutte</surname> <given-names>J. H.</given-names></name> <name><surname>Williams</surname> <given-names>Z. H.</given-names></name> <name><surname>Montesion</surname> <given-names>M.</given-names></name> <name><surname>Subramanian</surname> <given-names>R. P.</given-names></name> <name><surname>Kidd</surname> <given-names>J. M.</given-names></name> <name><surname>Coffin</surname> <given-names>J. M.</given-names></name></person-group> (<year>2016</year>). <article-title>Discovery of unfixed endogenous retrovirus insertions in diverse human populations</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>113</volume>, <fpage>E2326</fpage>&#x02013;<lpage>E2334</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1602336113</pub-id><pub-id pub-id-type="pmid">27001843</pub-id></citation>
</ref>
<ref id="B71">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>J. D.</given-names></name> <name><surname>Yang</surname> <given-names>L.</given-names></name> <name><surname>Zhang</surname> <given-names>Y. Y.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name> <name><surname>Wen</surname> <given-names>X. M.</given-names></name> <name><surname>Guo</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Overexpression of BAALC: clinical significance in Chinese de novo acute myeloid leukemia</article-title>. <source>Med. Oncol.</source> <volume>32</volume>:<fpage>386</fpage>. <pub-id pub-id-type="doi">10.1007/s12032-014-0386-9</pub-id><pub-id pub-id-type="pmid">25428390</pub-id></citation>
</ref>
</ref-list>
</back>
</article>