<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Toxicology</journal-id>
<journal-title>Frontiers in Toxicology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Toxicol.</abbrev-journal-title>
<issn pub-type="epub">2673-3080</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">846221</article-id>
<article-id pub-id-type="doi">10.3389/ftox.2022.846221</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Toxicology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Leveraging a High-Throughput Screening Method to Identify Mechanisms of Individual Susceptibility Differences in a Genetically Diverse Zebrafish Model</article-title>
<alt-title alt-title-type="left-running-head">Wallis et al.</alt-title>
<alt-title alt-title-type="right-running-head">Mechanistic Validation of High-Throughput Signals</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Wallis</surname>
<given-names>Dylan J.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1616761/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>La Du</surname>
<given-names>Jane</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Thunga</surname>
<given-names>Preethi</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1239877/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Elson</surname>
<given-names>Daniel</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1621288/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Truong</surname>
<given-names>Lisa</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1682921/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kolluri</surname>
<given-names>Siva K.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/938415/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tanguay</surname>
<given-names>Robyn L.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/40352/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Reif</surname>
<given-names>David M.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/275221/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Bioinformatics Research Center</institution>, <institution>Department of Biological Sciences</institution>, <institution>North Carolina State University</institution>, <addr-line>Raleigh</addr-line>, <addr-line>NC</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Sinnhuber Aquatic Research Laboratory</institution>, <institution>Department of Environmental and Molecular Toxicology</institution>, <institution>Oregon State University</institution>, <addr-line>Corvallis</addr-line>, <addr-line>OR</addr-line>, <country>United States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Cancer Research Laboratory</institution>, <institution>Department of Environmental and Molecular Toxicology</institution>, <institution>Oregon State University</institution>, <addr-line>Corvallis</addr-line>, <addr-line>OR</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/153766/overview">Michael J. Carvan</ext-link>, University of Wisconsin&#x2013;Milwaukee, United States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2957/overview">Robert Gerlai</ext-link>, University of Toronto, Canada</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/37976/overview">Scott Auerbach</ext-link>, National Institute of Environmental Health Sciences (NIH), United States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: David M. Reif, <email>dmreif@ncsu.edu</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Toxicogenomics, a section of the journal Frontiers in Toxicology</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>29</day>
<month>04</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>4</volume>
<elocation-id>846221</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>12</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>14</day>
<month>03</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Wallis, La Du, Thunga, Elson, Truong, Kolluri, Tanguay and Reif.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Wallis, La Du, Thunga, Elson, Truong, Kolluri, Tanguay and Reif</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Understanding the mechanisms behind chemical susceptibility differences is key to protecting sensitive populations. However, elucidating gene-environment interactions (GxE) presents a daunting challenge. While mammalian models have proven useful, problems with scalability to an enormous chemical exposome and clinical translation faced by all models remain; therefore, alternatives are needed. Zebrafish (<italic>Danio rerio</italic>) have emerged as an excellent model for investigating GxE. This study used a combined bioinformatic and experimental approach to probe the mechanisms underlying chemical susceptibility differences in a genetically diverse zebrafish population. Starting from high-throughput screening (HTS) data, a genome-wide association study (GWAS) using embryonic fish exposed to 0.6&#xa0;&#x3bc;M Abamectin revealed significantly different effects between individuals. A hypervariable region with two distinct alleles&#x2013;one with G at the SNP locus (GG) and one with a T and the 16&#xa0;bp deletion (TT)&#x2013;associated with differential susceptibility was found. Sensitive fish had significantly lower <italic>sox7</italic> expression. Due to their location and the observed expression differences, we hypothesized that these sequences differentially regulate <italic>sox7.</italic> A luciferase reporter gene assay was used to test if these sequences, alone, could lead to expression differences. The TT allele showed significantly lower expression than the GG allele in MCF-7 cells. To better understand the mechanism behind these expression differences, predicted transcription factor binding differences between individuals were compared <italic>in silico</italic>, and several putative binding differences were identified. EMSA was used to test for binding differences in whole embryo protein lysate to investigate these TF binding predictions. We confirmed that the GG sequence is bound to protein in zebrafish. Through a competition EMSA using an untagged oligo titration, we confirmed that the GG oligo had a higher binding affinity than the TT oligo, explaining the observed expression differences. This study identified differential susceptibility to chemical exposure in a genetically diverse population, then identified a plausible mechanism behind those differences from a genetic to molecular level. Thus, an HTS-compatible zebrafish model is valuable and adaptable in identifying GxE mechanisms behind susceptibility differences to chemical exposure.</p>
</abstract>
<kwd-group>
<kwd>high-throughput (HT) approaches</kwd>
<kwd>zebrafish</kwd>
<kwd>computational toxicology</kwd>
<kwd>mechanism</kwd>
<kwd>genomic</kwd>
<kwd>abamectin</kwd>
<kwd>pathways</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Population-wide differences in susceptibility to chemical exposures exert significant impacts in medicine and risk assessment (<xref ref-type="bibr" rid="B32">Suter et al., 2004</xref>; <xref ref-type="bibr" rid="B30">Roden et al., 2011</xref>; <xref ref-type="bibr" rid="B12">Gamazon and Perera, 2012</xref>; <xref ref-type="bibr" rid="B23">Motsinger-Reif et al., 2013</xref>). Identifying compounds that have vast differences in individual susceptibility across a genetically diverse population has important implications for how we prescribe drugs to treat disease, deal with environmental exposures, and regulate chemical producers (<xref ref-type="bibr" rid="B32">Suter et al., 2004</xref>; <xref ref-type="bibr" rid="B27">Qin et al., 2016</xref>). As of 2013 there were over 80,000 chemicals registered with the EPA that people could be exposed to (<xref ref-type="bibr" rid="B33">United States, 1986</xref>; <xref ref-type="bibr" rid="B4">Bergeson, 2000</xref>; <xref ref-type="bibr" rid="B17">Kinch et al., 2014</xref>). Yet, the mechanisms that lead to population-level variation in susceptibility remain poorly understood (<xref ref-type="bibr" rid="B39">Zhou et al., 2017</xref>; <xref ref-type="bibr" rid="B15">Jerry et al., 2018</xref>).</p>
<p>The National Research Council (NRC) stated in their document on the future of risk assessment, &#x201c;Science and Decisions&#x201d;, that susceptibility differences across different chemicals required more attention (<xref ref-type="bibr" rid="B24">National Research Council, 2009</xref>). In 2016, the Frank R. Lautenberg act amended The Toxic Substances Control Act (TSCA) to include the consideration of susceptible populations in risk assessment (<xref ref-type="bibr" rid="B33">United States, 1986</xref>; <xref ref-type="bibr" rid="B22">Mortensen and Euling, 2013</xref>; <xref ref-type="bibr" rid="B21">Mortensen et al., 2018</xref>). This cemented the importance of understanding the variables that can lead to differences in susceptibility in a population to diseases caused by chemical exposure.</p>
<p>Unfortunately, the study of how genetic differences and gene-environment interactions (GxE) can affect (sub)population response to an exposure is challenging for several reasons: Sample sizes of sufficient power are hard to achieve; Mechanisms are hard to parse out, Environmental variables are hard to control and separate; and Relating an exposure to a specific phenotype is challenging (<xref ref-type="bibr" rid="B18">Le Marchand and Wilkens, 2008</xref>; <xref ref-type="bibr" rid="B11">Freedman et al., 2011</xref>; <xref ref-type="bibr" rid="B19">McAllister et al., 2017</xref>; <xref ref-type="bibr" rid="B39">Zhou et al., 2017</xref>). Current knowledge says that regulatory variation in genes may be the primary cause of phenotypic differences in humans (<xref ref-type="bibr" rid="B22">Mortensen and Euling, 2013</xref>). These regions are harder to disentangle to gain an understanding of their effect on susceptibility. In addition to this, while new approach methodologies (NAMs) can identify chemicals with the potential to elicit clinically observable adverse effects, comprehensive risk assessment is hampered by differential susceptibility across exposed individuals. In past studies, animal models have been used to identify and implicate specific genes that lead to susceptibility to different diseases in humans (<xref ref-type="bibr" rid="B22">Mortensen and Euling, 2013</xref>; <xref ref-type="bibr" rid="B21">Mortensen et al., 2018</xref>). Current risk assessment methods use uncertainty factors when calculating acceptable exposure levels to approximate differences between susceptible and resistant populations (<xref ref-type="bibr" rid="B22">Mortensen and Euling, 2013</xref>; <xref ref-type="bibr" rid="B21">Mortensen et al., 2018</xref>).</p>
<p>Zebrafish (<italic>Danio rerio</italic>) have emerged as an excellent model of human disease that are well suited for high-throughput <italic>in vivo</italic> assays: They produce a large number of offspring; They have phenotypes that can easily be compared to human diseases; Their embryos are transparent and develop <italic>ex vivo</italic>; Phenotypes can be assessed as early as 24&#xa0;h after fertilization; And they can be separated into wells to be exposed individually to allow for a highly controlled environment (<xref ref-type="bibr" rid="B35">Truong et al., 2011</xref>; <xref ref-type="bibr" rid="B36">Truong et al., 2014</xref>; <xref ref-type="bibr" rid="B14">Garcia et al., 2016</xref>; <xref ref-type="bibr" rid="B34">Truong et al., 2016</xref>; <xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>). Chemical testing using zebrafish provides phenotypic responses that can reveal the etiology of many adverse outcomes (<xref ref-type="bibr" rid="B35">Truong et al., 2011</xref>; <xref ref-type="bibr" rid="B36">Truong et al., 2014</xref>; <xref ref-type="bibr" rid="B14">Garcia et al., 2016</xref>; <xref ref-type="bibr" rid="B29">Reif et al., 2016</xref>; <xref ref-type="bibr" rid="B34">Truong et al., 2016</xref>; <xref ref-type="bibr" rid="B38">Zhang et al., 2017</xref>; <xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>; <xref ref-type="bibr" rid="B13">Garcia et al., 2018</xref>). Zebrafish are also the only vertebrate model that can be assayed in a high throughput manner at the phylotypic stage of development that is most similar to vertebrate early development (<xref ref-type="bibr" rid="B14">Garcia et al., 2016</xref>). Unlike an <italic>in vitro</italic> system or another <italic>in vivo</italic> vertebrate system, zebrafish can reveal the mechanisms of complex phenotypic responses to chemicals in a high-throughput and cost-effective manner (<xref ref-type="bibr" rid="B35">Truong et al., 2011</xref>; <xref ref-type="bibr" rid="B36">Truong et al., 2014</xref>; <xref ref-type="bibr" rid="B14">Garcia et al., 2016</xref>; <xref ref-type="bibr" rid="B34">Truong et al., 2016</xref>; <xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>). The T5D zebrafish line used here is an outbred zebrafish line that mimics human genetic diversity and acts as an excellent proxy for assessing differential susceptibility to many different chemicals (<xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>; <xref ref-type="bibr" rid="B3">Balik-Meisner et al., 2018b</xref>). A study on the genetic diversity of T5D zebrafish found 10.3&#x2013;20.1&#xa0;M SNPs and 2.8&#x2013;5.6&#xa0;M indels across the population (<xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>; <xref ref-type="bibr" rid="B3">Balik-Meisner et al., 2018b</xref>). As a comparison, the 1,000 genome project found that humans had 84.7&#xa0;M SNP, 3.6&#xa0;M short indels (The 1000 Genomes Project Consortium et al., 2015).</p>
<p>This study acts as a proof of concept that HTS for developmental effects of exposure to a large array of chemicals can identify those associated with GxE that elicit differences in individual susceptibility across the genetically diverse T5D zebrafish line (<xref ref-type="bibr" rid="B35">Truong et al., 2011</xref>; <xref ref-type="bibr" rid="B36">Truong et al., 2014</xref>; <xref ref-type="bibr" rid="B34">Truong et al., 2016</xref>; <xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>). The data in this study uses information gained from a screening of 1078 EPA ToxCast phase 1 and 2 chemicals (<xref ref-type="bibr" rid="B35">Truong et al., 2011</xref>; <xref ref-type="bibr" rid="B36">Truong et al., 2014</xref>; <xref ref-type="bibr" rid="B34">Truong et al., 2016</xref>; <xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>). Several chemicals, including abamectin, showed substantial differences in developmental effects across zebrafish, suggesting that underlying genetic variation may play a role in exposure-response. Abamectin, an agricultural insecticide that has been associated with neurotoxicity, developmental effects, and endocrine disruption according to a risk assessment by the European Food Safety Authority (<xref ref-type="bibr" rid="B1">Anastassiadou et al., 2020</xref>), was selected for further investigation due to robust population susceptibility differences across multiple rounds of rangefinder experiments. In a genome-wide association study (GWAS) of developmental exposure to Abamectin, multiple single-nucleotide polymorphisms (SNPs) were discovered that were associated with differential effects (<xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>). Some of these SNPs were located upstream of the SRY-Box Transcription Factor 7 (<italic>sox7</italic>) gene. Human SOX7 plays several important roles in development including cell differentiation, regulation between cell proliferation and differentiation, lineage determination, regulation of angiogenesis and vasculogenesis, and also acts as a tumor suppressor (<xref ref-type="bibr" rid="B31">Stovall et al., 2014</xref>). Zebrafish Sox7 is orthologous to human SOX7 and is predicted to play a similar role in producing a DNA-binding transcription factor that helps to guide development (<xref ref-type="bibr" rid="B37">Zfin Gene, 2021</xref>).</p>
<p>When interrogated using real-time polymerase chain reaction (real-time PCR) <italic>sox7</italic> exhibited significant expression differences between fish that were sensitive to abamectin expression (&#x201c;affected&#x201d;) and fish that were not (&#x201c;unaffected&#x201d;) (<xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>). This led to the hypothesis that susceptibility to abamectin was affected by regulation of <italic>sox7.</italic> Here, we describe a discovery path (<xref ref-type="fig" rid="F1">Figure 1</xref>) of bioinformatically-guided experimentation to test our hypothesis that genetic variation influences population responses to environmental exposure (GxE). As part of the broader approach, this study aimed to validate a plausible mechanism behind HTS-scale patterns of differential response down to a detailed molecular and genetic level.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>This figure illustrates the experimental flow of this study which could be tailored or branched, based on the progression of biochemical and wet-lab experiments, to apply it to similar studies. Bioinformatic approaches were used to generate hypotheses which were then tested <italic>via</italic> biochemical experimentation. A high-throughput GWAS experiment followed by a more <italic>in-depth</italic> analysis of a single genetic region was followed-up with RT-PCR to test if <italic>sox7</italic> expression differed in the affected an unaffected fish. This was then followed up by <italic>in silico</italic> analysis of the region to identify possible TF binding differences. The results of that comparison were confirmed with EMSA to test for differences in binding affinities across the variants and their ability to cause differential expression was probed with a luciferase assay.</p>
</caption>
<graphic xlink:href="ftox-04-846221-g001.tif"/>
</fig>
</sec>
<sec id="s2">
<title>2 Materials and Methods</title>
<sec id="s2-1">
<title>2.1 Experimental Overview</title>
<p>A high-throughput screening (HTS), genome-wide association study (GWAS) was performed to identify loci that were associated with individual differences in susceptibility across an outbred zebrafish population as described in <xref ref-type="bibr" rid="B2">Balik-Meisner et al. (2018a)</xref>. Briefly, the study leveraged data from thousands of chemicals, as well as a method that quantified morphological effects of developmental exposure in an outbred zebrafish population to identify chemicals that showed high variability in effect across the population (<xref ref-type="bibr" rid="B38">Zhang et al., 2017</xref>; <xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>). Abamectin was chosen from these high-variance chemicals. After identifying a critical concentration, larval zebrafish were exposed (<xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>). Affected and unaffected zebrafish larvae were collected and their DNA was individually sequenced to identify loci associated with susceptibility (<xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>). This study identified significant expression differences in <italic>sox7</italic> between affected and unaffected zebrafish using PCR (<xref ref-type="bibr" rid="B2">Balik-Meisner et al., 2018a</xref>). A combined bioinformatic and biochemical approach was used to validate the results from the previous study and identify the mechanism that leads to susceptibility differences. Transcription factor binding site (TFBS) prediction was used to identify putative transcription factor binding differences between individual fish. Following the TFBS prediction analysis, an electrophoretic mobility shift assay (EMSA) was used to assess binding between these sequences and proteins in zebrafish nuclear protein extract. A luciferase assay was then used to measure expression differences between the two presumed regulatory regions.</p>
</sec>
<sec id="s2-2">
<title>2.2 Zebrafish Model</title>
<p>Tropical 5D (T5D) wild type zebrafish were housed at Sinnhuber Aquatic Research Laboratory at Oregon State University, in a density of approximately 1,000 fish per 100-gallon tank. Tank water consisting of reverse osmosis water supplemented with Instant Ocean&#x2122; salts were kept at standard laboratory conditions of 28&#xb0;C on a 14-h light/10-h dark photoperiod. The water was at a salinity of 600&#xa0;&#x3bc;S and maintained at a pH of 7.4 (<xref ref-type="bibr" rid="B40">Mandrell et al., 2012</xref>; <xref ref-type="bibr" rid="B41">Barton et al., 2016</xref>). Mass spawning funnels were placed into the tanks the night prior, and the following morning embryos were collected, staged and cleaned (<xref ref-type="bibr" rid="B16">Kimmel et al., 1995</xref>). T5D zebrafish originated from 25 small group crosses containing three males and three females imported from a breeding facility. Following generations have been bred with equal proportions of offspring from a minimum of 25 small group crosses, each group containing three males and up to three females (<xref ref-type="bibr" rid="B3">Balik-Meisner et al., 2018b</xref>). For more details on the genetic diversity of the T5D line please see <xref ref-type="bibr" rid="B3">Balik-Meisner et al. (2018b)</xref>. Zebrafish embryos were obtained <italic>via</italic> group spawning and were dechorionated after collection and placed in 96 well plates as detailed in multiple papers by <xref ref-type="bibr" rid="B35">Truong et al. (2011)</xref> and <xref ref-type="bibr" rid="B36">Truong et al. (2014)</xref>. The T5D zebrafish line was used for all zebrafish experiments in this study.</p>
</sec>
<sec id="s2-3">
<title>2.3 Deep Reanalysis</title>
<p>The preliminary study identified a putative hyper-variable region upstream of <italic>sox7</italic> that was associated with susceptibility on chromosome 20. In order to identify loci that were associated with susceptibility within this region a secondary analysis of chromosome 20 was done. Paired end reads from the previous HT sequencing were trimmed with trimmomatic version 0.39 using the following parameters: ILLUMINACLIP:TruSeq3-PE.fa:2:30:10, LEADING:3, TRAILING:3, SLIDINGWINDOW:4:15, and MINLEN:36 (<xref ref-type="bibr" rid="B5">Bolger et al., 2014</xref>). Quality control was done on the sequences using fastqc to ensure the quality of the sequences for further analysis (<xref ref-type="bibr" rid="B10">Ewels et al., 2016</xref>). Sequences were aligned using the software package Burrows-Wheeler Aligner (BWA-MEM) with standard parameters (<xref ref-type="bibr" rid="B6">bwa.1, 2021</xref>).</p>
<p>Sam files were converted to bam files using the software package samtools (samtools). The bam files were sorted, indexed, and duplicates were marked using the software package picard prior to analysis (<xref ref-type="bibr" rid="B25">Picard Tools - By Broad Institute, 2021</xref>). Joint genotyping was done using GenomeAnalysisToolkit (GATK) HaplotypeCaller and gvcf files were merged using GATK CombineGVCFs (<xref ref-type="bibr" rid="B20">McKenna et al., 2010</xref>; <xref ref-type="bibr" rid="B9">DePristo et al., 2011</xref>). After variants were called, GATK VariantFiltration was used to filter out SNPs with the parameters: QualByDepth (QD) &#x3c; 2, FisherStrand (FS) &#x3e; 60, RMSMappingQuality (MQ) &#x3c; 40, MQRankSum &#x3c; &#x2212;12.5, and ReadPosRankSum &#x3c; &#x2212;8; as well as indels with QD &#x3c; 2, FS &#x3e; 200.0, and ReadPosRankSum &#x3c; &#x2212;20 (<xref ref-type="bibr" rid="B9">DePristo et al., 2011</xref>). Finally, association testing was done in PLINK version 1.9 using Fisher&#x2019;s exact test with a Bonferroni correction to correct for multiple testing (<xref ref-type="bibr" rid="B26">Purcell et al., 2007</xref>).</p>
</sec>
<sec id="s2-4">
<title>2.4 Transcription Factor Binding Site Prediction</title>
<sec id="s2-4-1">
<title>2.4.1 Software</title>
<p>MatInspector, an online program, was used to analyze the sequences upstream of <italic>sox7</italic> for each individual fish. MatInspector uses information on core sequences and nucleotide data on a number of transcription factors to generate a list of putative transcription factor binding sites, scored for goodness of fit using a scoring algorithm. For a more <italic>in-depth</italic> explanation of MatInspector see <xref ref-type="bibr" rid="B7">Cartharius et al. (2005)</xref> or the Genomatix website (<xref ref-type="bibr" rid="B7">Cartharius et al., 2005</xref>). A core similarity score of 0.75 was used to filter out unlikely matches.</p>
</sec>
<sec id="s2-4-2">
<title>2.4.2 Binding Site Curation</title>
<p>Differences between sequences with G or T at the primary SNP loci were compared using a chi-squared test to identify significant differences using the observed number of each predicted binding site across both genotypes. The test was done using the chisq.test command from the R package stats version 3.6.3 (<xref ref-type="bibr" rid="B28">R Core Team, 2020</xref>). This list of putative TFBSs were then curated manually by selecting transcription factors with homologues in zebrafish and sites that were within the 44&#xa0;bp area between the beginning of the Indel and the SNP.</p>
</sec>
</sec>
<sec id="s2-5">
<title>2.5 Luciferase Assay</title>
<sec id="s2-5-1">
<title>2.5.1 Assay</title>
<p>Double stranded oligos corresponding to the region &#x2212;900 to &#x2b;29&#xa0;bp of <italic>Sox7</italic>-201 variant TSS were synthesized and cloned in to pUCIDT vectors by IDT. Additional recognition sequence for restriction enzymes NheI and XhoI were added to ends for cloning into the minimal promoter pGL4.23 [<italic>luc2/minP</italic>] vector (Promega, E8411) for the luciferase assay. Sequences from positive clones were verified by Sanger sequencing at the Oregon State University Center for Genome Research and Biocomputing Core. Plasmids were purified with ZymoPURE Plasmid Miniprep Kit (Zymo Research).</p>
<p>MCF7 cells were seeded in a 24-well plate in 10% serum Dulbecco&#x2019;s Modified Eagle Medium (DMEM). The cells were transfected the following morning with the TT sequence, GG sequence, or vector control reporters as well as a &#x3b2;-galactose (&#x3b2;-gal) plasmid using 300&#xa0;ng reporter, 200&#xa0;ng &#x3b2;-gal, and 2&#xa0;&#x3bc;L lipofectamine per well. The sequences inserted into the vector are given below, annotated as: restriction enzyme sites underlined; transcription start site (TSS) in bold.</p>
<p>GG sequence: GCT&#x200b;AGCACA&#x200b;TAA&#x200b;ATC&#x200b;CAA&#x200b;TTC&#x200b;ATT&#x200b;TAG&#x200b;CGA&#x200b;AAA&#x200b;TAT&#x200b;TTA&#x200b;TTT&#x200b;TTA&#x200b;CGA&#x200b;TAT&#x200b;TTA&#x200b;TGA&#x200b;ATT&#x200b;GCG&#x200b;AAT&#x200b;TGT&#x200b;GTG&#x200b;TTG&#x200b;TAT&#x200b;TTA&#x200b;TGA&#x200b;GTT&#x200b;GTG&#x200b;TTT&#x200b;TGC&#x200b;ATT&#x200b;TAC&#x200b;AAT&#x200b;TTG&#x200b;GAT&#x200b;TTT&#x200b;GTA&#x200b;AAT&#x200b;TTT&#x200b;GAG&#x200b;TTG&#x200b;TGC&#x200b;ATT&#x200b;AAT&#x200b;TTT&#x200b;ATT&#x200b;TTG&#x200b;TAA&#x200b;ATG&#x200b;TAT&#x200b;TAT&#x200b;TTT&#x200b;TGA&#x200b;GAC&#x200b;TGA&#x200b;TCT&#x200b;GGC&#x200b;TCC&#x200b;ATA&#x200b;AAA&#x200b;ATC&#x200b;CTG&#x200b;GTT&#x200b;TTT&#x200b;ATT&#x200b;TGT&#x200b;AGT&#x200b;ATT&#x200b;CCT&#x200b;AGA&#x200b;AAG&#x200b;CTT&#x200b;ATT&#x200b;GTA&#x200b;TAT&#x200b;TTC&#x200b;TAG&#x200b;TCA&#x200b;AGC&#x200b;TTG&#x200b;AAA&#x200b;ATA&#x200b;AAT&#x200b;GTT&#x200b;AAA&#x200b;ATA&#x200b;TGG&#x200b;GTG&#x200b;AAA&#x200b;TAC&#x200b;GGA&#x200b;ACA&#x200b;AAA&#x200b;TAT&#x200b;AGA&#x200b;TCA&#x200b;TGC&#x200b;TAA&#x200b;ATA&#x200b;TAT&#x200b;ATA&#x200b;TAT&#x200b;ATA&#x200b;TGT&#x200b;ATA&#x200b;TAT&#x200b;TTG&#x200b;TGC&#x200b;TTT&#x200b;AAA&#x200b;TGA&#x200b;TTG&#x200b;CAC&#x200b;ATT&#x200b;TAC&#x200b;AAT&#x200b;CTT&#x200b;AGA&#x200b;AAG&#x200b;ACA&#x200b;GTA&#x200b;AAA&#x200b;GGT&#x200b;ATA&#x200b;AAT&#x200b;AAT&#x200b;AAA&#x200b;ATT&#x200b;ACA&#x200b;ATG&#x200b;AAT&#x200b;TAG&#x200b;TAT&#x200b;TTT&#x200b;GGA&#x200b;TTT&#x200b;TTT&#x200b;TTT&#x200b;TTT&#x200b;TTT&#x200b;TGC&#x200b;AAA&#x200b;AAA&#x200b;TGC&#x200b;TTC&#x200b;TCC&#x200b;TTT&#x200b;CTG&#x200b;GTC&#x200b;ACT&#x200b;ACA&#x200b;GAT&#x200b;ACA&#x200b;TTT&#x200b;GCT&#x200b;TTC&#x200b;ACA&#x200b;TAA&#x200b;AAT&#x200b;AAA&#x200b;ACA&#x200b;CAT&#x200b;AGT&#x200b;CAT&#x200b;ATC&#x200b;CCT&#x200b;TAT&#x200b;CAA&#x200b;ATG&#x200b;TGC&#x200b;ATT&#x200b;ACT&#x200b;GAA&#x200b;ACT&#x200b;GAA&#x200b;AAA&#x200b;CAC&#x200b;GTC&#x200b;TTT&#x200b;TAT&#x200b;TTG&#x200b;TTT&#x200b;GAT&#x200b;ATT&#x200b;GTG&#x200b;GCA&#x200b;AAA&#x200b;CTT&#x200b;GAG&#x200b;GTC&#x200b;TCA&#x200b;ATG&#x200b;CAA&#x200b;ATC&#x200b;ATA&#x200b;GAT&#x200b;CCC&#x200b;AAT&#x200b;AAC&#x200b;ACC&#x200b;AAC&#x200b;ATT&#x200b;CAC&#x200b;CTG&#x200b;TAA&#x200b;ACT&#x200b;TTT&#x200b;AGC&#x200b;ATT&#x200b;ACA&#x200b;TTA&#x200b;TAT&#x200b;TGC&#x200b;TGT&#x200b;TTA&#x200b;ATT&#x200b;CAC&#x200b;ACA&#x200b;GCG&#x200b;CTC&#x200b;ACA&#x200b;AAA&#x200b;CCA&#x200b;CTC&#x200b;GCA&#x200b;CGC&#x200b;CTG&#x200b;CAT&#x200b;TTC&#x200b;CCC&#x200b;TAT&#x200b;GCT&#x200b;AAT&#x200b;CAG&#x200b;ACG&#x200b;AAA&#x200b;TAG&#x200b;GAA&#x200b;GAA&#x200b;GTG&#x200b;CCT&#x200b;CCG&#x200b;AAT&#x200b;GCA&#x200b;GAA&#x200b;CCA&#x200b;CAA&#x200b;AGA&#x200b;TGT&#x200b;TTA&#x200b;TCT&#x200b;CGC&#x200b;TTT&#x200b;CGG&#x200b;CAC&#x200b;TTC&#x200b;ACA&#x200b;CCC&#x200b;AAA&#x200b;AAT&#x200b;AAT&#x200b;GTG&#x200b;CAG&#x200b;GTA&#x200b;GGA&#x200b;CCA&#x200b;GGA&#x200b;GAG&#x200b;CAG&#x200b;GAA&#x200b;GTG&#x200b;GAC&#x200b;TGT&#x200b;CAT&#x200b;TTT&#x200b;TTG&#x200b;TCG&#x200b;GAA&#x200b;TGT&#x200b;TTT&#x200b;TTT&#x200b;GCA&#x200b;ATC&#x200b;TGG&#x200b;GGC&#x200b;ATC&#x200b;AAG&#x200b;CTC&#x200b;CTC&#x200b;TTC&#x200b;CTG&#x200b;TTC&#x200b;CTG&#x200b;GAG&#x200b;GAA&#x200b;TAA&#x200b;AGC&#x200b;CCA&#x200b;CAT&#x200b;TTT<bold>AAT&#x200b;GAT&#x200b;GCT&#x200b;CAT&#x200b;CCT&#x200b;CTG&#x200b;CTT&#x200b;GTT&#x200b;CAC&#x200b;TGCTC&#x200b;GAG</bold>.</p>
<p>TT sequence: GCT&#x200b;AGC&#x200b;ACAT&#x200b;AAA&#x200b;TCC&#x200b;AAT&#x200b;TCA&#x200b;TTT&#x200b;AGC&#x200b;GAA&#x200b;AAT&#x200b;ATT&#x200b;TAT&#x200b;TTT&#x200b;TAC&#x200b;GAT&#x200b;ATT&#x200b;TAT&#x200b;GAA&#x200b;TTG&#x200b;CGA&#x200b;ATT&#x200b;GTG&#x200b;TGT&#x200b;TGT&#x200b;ATT&#x200b;TAT&#x200b;GAG&#x200b;TTG&#x200b;TGT&#x200b;TTT&#x200b;GCA&#x200b;TTT&#x200b;ACA&#x200b;ATT&#x200b;TGG&#x200b;ATT&#x200b;TTG&#x200b;TAA&#x200b;ATT&#x200b;TTG&#x200b;AGT&#x200b;TGT&#x200b;GCA&#x200b;TTA&#x200b;ATT&#x200b;TTA&#x200b;TTT&#x200b;TGT&#x200b;AAA&#x200b;TGT&#x200b;ATT&#x200b;ATT&#x200b;TTT&#x200b;GAG&#x200b;ACT&#x200b;GAT&#x200b;CTG&#x200b;GCT&#x200b;CCA&#x200b;TAA&#x200b;AAA&#x200b;TCC&#x200b;TGG&#x200b;TTT&#x200b;TTA&#x200b;TTT&#x200b;GTA&#x200b;GTA&#x200b;TTC&#x200b;CTA&#x200b;GAA&#x200b;AGC&#x200b;TTA&#x200b;TTG&#x200b;TAT&#x200b;ATT&#x200b;TCT&#x200b;AGT&#x200b;CAA&#x200b;GCT&#x200b;TGA&#x200b;AAA&#x200b;TAA&#x200b;ATG&#x200b;TTA&#x200b;AAA&#x200b;TAT&#x200b;GGG&#x200b;TGA&#x200b;AAT&#x200b;ACG&#x200b;GAA&#x200b;CAA&#x200b;AAT&#x200b;ATA&#x200b;GAT&#x200b;CAT&#x200b;GCT&#x200b;AAA<bold>&#x7c;</bold>TAT&#x200b;ATA&#x200b;TTT&#x200b;GTG&#x200b;CTT&#x200b;TAA&#x200b;ATT&#x200b;ATT&#x200b;GCA&#x200b;CAT&#x200b;TTA&#x200b;CAA&#x200b;TCT&#x200b;TAG&#x200b;AAA&#x200b;GAC&#x200b;AGT&#x200b;AAA&#x200b;AGG&#x200b;TAT&#x200b;AAA&#x200b;TAA&#x200b;TAA&#x200b;AAT&#x200b;TAC&#x200b;AAT&#x200b;GAA&#x200b;TTA&#x200b;GTA&#x200b;TTT&#x200b;TGG&#x200b;ATT&#x200b;TTT&#x200b;TTT&#x200b;TTT&#x200b;TTT&#x200b;TTG&#x200b;CAA&#x200b;AAA&#x200b;ATG&#x200b;CTT&#x200b;CTC&#x200b;CTT&#x200b;TCT&#x200b;GGT&#x200b;CAC&#x200b;TAC&#x200b;AGA&#x200b;TAC&#x200b;ATT&#x200b;TGC&#x200b;TTT&#x200b;CAC&#x200b;ATA&#x200b;AAA&#x200b;TAA&#x200b;AAC&#x200b;ACA&#x200b;TAG&#x200b;TCA&#x200b;TAT&#x200b;CCC&#x200b;TTA&#x200b;TCA&#x200b;AAT&#x200b;GTG&#x200b;CAT&#x200b;TAC&#x200b;TGA&#x200b;AAC&#x200b;TGA&#x200b;AAA&#x200b;ACA&#x200b;CGT&#x200b;CTT&#x200b;TTA&#x200b;TTT&#x200b;GTT&#x200b;TGA&#x200b;TAT&#x200b;TGT&#x200b;GGC&#x200b;AAA&#x200b;ACT&#x200b;TGA&#x200b;GGT&#x200b;CTC&#x200b;AAT&#x200b;GCA&#x200b;AAT&#x200b;CAT&#x200b;AGA&#x200b;TCC&#x200b;CAA&#x200b;TAA&#x200b;CAC&#x200b;CAA&#x200b;CAT&#x200b;TCA&#x200b;CCT&#x200b;GTA&#x200b;AAC&#x200b;TTT&#x200b;TAG&#x200b;CAT&#x200b;TAC&#x200b;ATT&#x200b;ATA&#x200b;TTG&#x200b;CTG&#x200b;TTT&#x200b;AAT&#x200b;TCA&#x200b;CAC&#x200b;AGC&#x200b;GCT&#x200b;CAC&#x200b;AAA&#x200b;ACC&#x200b;ACT&#x200b;CGC&#x200b;ACG&#x200b;CCT&#x200b;GCA&#x200b;TTT&#x200b;CCC&#x200b;CTA&#x200b;TGC&#x200b;TAA&#x200b;TCA&#x200b;GAC&#x200b;GAA&#x200b;ATA&#x200b;GGA&#x200b;AGA&#x200b;AGT&#x200b;GCC&#x200b;TCC&#x200b;GAA&#x200b;TGC&#x200b;AGA&#x200b;ACC&#x200b;ACA&#x200b;AAG&#x200b;ATG&#x200b;TTT&#x200b;ATC&#x200b;TCG&#x200b;CTT&#x200b;TCG&#x200b;GCA&#x200b;CTT&#x200b;CAC&#x200b;ACC&#x200b;CAA&#x200b;AAA&#x200b;TAA&#x200b;TGT&#x200b;GCA&#x200b;GGT&#x200b;AGG&#x200b;ACC&#x200b;AGG&#x200b;AGA&#x200b;GCA&#x200b;GGA&#x200b;AGT&#x200b;GGA&#x200b;CTG&#x200b;TCA&#x200b;TTT&#x200b;TTT&#x200b;GTC&#x200b;GGA&#x200b;ATG&#x200b;TTT&#x200b;TTT&#x200b;TGC&#x200b;AAT&#x200b;CTG&#x200b;GGG&#x200b;CAT&#x200b;CAA&#x200b;GCT&#x200b;CCT&#x200b;CTT&#x200b;CCT&#x200b;GTT&#x200b;CCT&#x200b;GGA&#x200b;GGA&#x200b;ATA&#x200b;AAG&#x200b;CCC&#x200b;ACA&#x200b;TTT&#x200b;T<bold>AAT&#x200b;GAT&#x200b;GCT&#x200b;CAT&#x200b;CCT&#x200b;CTG&#x200b;CTT&#x200b;GTT&#x200b;CAC&#x200b;TGCTC&#x200b;GAG</bold>.</p>
<p>After 8&#xa0;h of, cells were treated with either vehicle (0.1% DMSO), 500&#xa0;nM abamectin (Sigma &#x23;31732), or 5&#xa0;&#x3bc;M abamectin in triplicate for each condition. After 48&#xa0;h, the cells were harvested for reporter gene activity. A luciferase assay and &#x3b2;-gal assay were run on the harvested cells. The raw luciferase values were normalized to the &#x3b2;-gal values.</p>
</sec>
<sec id="s2-5-2">
<title>2.5.2 Statistical Methods</title>
<p>Data from the luciferase assay was analyzed in R (<xref ref-type="bibr" rid="B28">R Core Team, 2020</xref>). The <italic>lm</italic> command from the stats package was used to build a linear model to estimate differences between inserts and identify any interactions between dose and insert. One-way ANOVA was done in R to compare across dose (0, 0.5, 5&#xa0;&#x3bc;M abamectin) and insert (control, TT or, GG) and to test for interaction between all dose and insert combinations. Tukey&#x2019;s honest significant difference test was used to compare different insert, dose pairs using <italic>tukeyHSD</italic> from r stats.</p>
</sec>
</sec>
<sec id="s2-6">
<title>2.6 Electrophoretic Mobility Shift Assay</title>
<sec id="s2-6-1">
<title>2.6.1 Embryo Preparation</title>
<p>At 48&#xa0;hpf embryonic chorions were mechanically removed with forceps for any unhatched embryos and three pools of 120 embryos each were collected. Embryos were anesthetized with 0.0072% tricaine methanesulfonate prior to protein extraction.</p>
</sec>
<sec id="s2-6-2">
<title>2.6.2 Nuclear Protein Extraction</title>
<p>Manufactures protocol for tissue nuclear protein extraction was followed using ThermoFisher NE-PER nuclear and Cytoplasmic Extraction Kit (78833) and Halt Protease Inhibitor Cocktail, EDTA-free (&#xd7;100) (78425) without modifications. Final nuclear extract volume was 200&#xa0;&#x3bc;l per sample.</p>
<p>Nuclear protein fraction concentrations were calculated using Pierce BCA Protein Assay kit (ThermoFisher, &#x23;23225) and a Beckman DU800 spectrophotometer. Extracts ranged from 1.8 to 2.2&#xa0;&#x3bc;g/&#x3bc;l.</p>
</sec>
<sec id="s2-6-3">
<title>2.6.3 Oligo Design</title>
<p>Oligo sequences were chosen using predicted binding site sequence for the upstream region of <italic>sox7</italic> from the Genomatix analysis. Both sequences were design to be 26&#xa0;bps long so that binding differences couldn&#x2019;t be attributed to differences in length. The TT oligo contains the sequence on either side of the indel with the deletion. The TT oligo is extended by 16&#xa0;bps in the 3&#x2032; direction, following the sequence in the region of interest to reach the required 26&#xa0;bps.</p>
</sec>
<sec id="s2-6-4">
<title>2.6.4 Oligo Preparation</title>
<p>Single strand oligos were synthesized by IDT, (San Diego, CA, United States) as either unlabeled or 5&#x2032; end labeled with LI-COR IRDye<sup>&#xae;</sup> 700. The oligo sequences are as follows:</p>
<p>Labeled Sense GG version: 5&#x2032;IRD700/CATGCTAAATATATATATATATATGT.</p>
<p>Labeled Antisense GG version: 5&#x2032;IRD700/ACATATATATATATATATTTAGCATG.</p>
<p>Unlabeled competition GG version sense: 5&#x2032;CAT&#x200b;GCT&#x200b;AAA&#x200b;TAT&#x200b;ATA&#x200b;TAT&#x200b;ATA&#x200b;TAT&#x200b;GT.</p>
<p>Unlabeled competition GG version antisense: 5&#x2032;ACA&#x200b;TAT&#x200b;ATA&#x200b;TAT&#x200b;ATA&#x200b;TAT&#x200b;TTA&#x200b;GCA&#x200b;TG.</p>
<p>Unlabeled competition TT version sense: 5&#x2032;CAT&#x200b;GCT&#x200b;AAA&#x7c;TAT&#x200b;ATA&#x200b;TTT&#x200b;GTG&#x200b;CTT&#x200b;TA.</p>
<p>Unlabeled competition TT version antisense: 5&#x2032;TAA&#x200b;AGC&#x200b;ACA&#x200b;AAT&#x200b;ATA&#x200b;TAT&#x200b;TTA&#x200b;GCA&#x200b;TG.</p>
<p>Oligos were reconstituted in TE buffer (10&#xa0;mM Tris, 1&#xa0;mM EDTA, pH 8.0) and diluted to 20&#xa0;&#x3bc;M. Sense and complimentary antisense oligos were annealed by mixing 20&#xa0;&#x3bc;l of each paired strand, heating at 100&#xb0; for 5&#xa0;min followed by slowly cooling tube in heat block to room temperature overnight. Annealed IR700 oligo was then further diluted 1:200 and small aliquots were stored at &#x2212;20&#xb0;C. Competitor oligos stocks were kept at 20&#xa0;&#x3bc;M equaling &#xd7;200 the labeled oligo concentration.</p>
</sec>
<sec id="s2-6-5">
<title>2.6.5 Binding and Competition Assays</title>
<p>Odyssey EMSA Kit reagents were purchased from LI-COR Biosciences, Inc., Lincoln, NE, United States, Optimization for DNA/protein binding conditions were performed according to manufactures suggested protocol. Optimal binding buffer components were found to be as follows: 2&#xa0;&#x3bc;l 10&#xd7; Binding Buffer, 2ul 25&#xa0;mM DTT/2.5% Tween20, 1&#xa0;&#x3bc;l 1&#xa0;M KCL, 1&#xa0;&#x3bc;l 100&#xa0;nM end-labeled oligo (100&#xa0;fmol), 5.6&#xa0;&#x3bc;g nuclear protein extract, water to final 20&#xa0;&#x3bc;l volume. Optimization trials with varying concentrations of poly (dI&#xb7;dC) indicated it interfered with DNA binding and was left out of subsequent runs. Reagents were mixed in microtube and incubated for 30&#xa0;min at room temperature. 2&#xa0;&#x3bc;l of &#xd7;10 Orange load dye was added immediately before loading entire sample in to wells of a BioRad Mini-Protean 5% TBE precast gel. Electrophoresis was run in &#xd7;0.5 TBE buffer at 70&#xa0;V for 60&#x2013;70&#xa0;min.</p>
<p>For competition assays, unlabeled oligos were tested in a range from &#xd7;200 down to &#xd7;12.5 (20&#x2013;1.25&#xa0;pmol) of IR700 oligo concentration. Competitors were added to reaction mix first and incubated for 10&#xa0;min to allow binding to protein before addition of labeled oligo. Reaction then incubated 20&#xa0;min longer. Images were acquired on the Azure 600 Imaging System, (Azure Biosystems, Inc., Dublin, CA, United States) and image was inverted for better definition.</p>
</sec>
</sec>
</sec>
<sec id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Deep Reanalysis of Region Associated With Responses to Exposure</title>
<p>Utilizing data from previous GWAS work published in <xref ref-type="bibr" rid="B2">Balik-Meisner et al. (2018a)</xref> and previous HTS data from <xref ref-type="bibr" rid="B36">Truong et al. (2014)</xref> the region identified as being associated with differences in individual susceptibility to abamectin exposure was analyzed to identify further genetic differences that may be contributing to susceptibility differences across fish (<xref ref-type="bibr" rid="B36">Truong et al., 2014</xref>; <xref ref-type="bibr" rid="B3">Balik-Meisner et al., 2018b</xref>). This analysis identified multiple SNPs and an Indel that showed significant association with these differences in susceptibility. The most significantly associated SNP as well as the indel can be seen in <xref ref-type="fig" rid="F2">Figure 2</xref>. These polymorphisms represent the most common alleles in a highly variable region of the zebrafish genotype upstream of <italic>sox7</italic>, an important gene in development (<xref ref-type="bibr" rid="B31">Stovall et al., 2014</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Multiple sequence alignment that displays examples of the two primary genotypes (TT and GG) the larger deletion can be seen tied to the T genotype. The indel is highlighted by a green bracket while a red rectangle highlights the SNPs. These features are also highlight on a drawing that represents the results of the transcription factor binding site prediction. The colored ovals represent different proteins, with three different representative individuals showing how protein binding is predicted differently by the software in different individuals.</p>
</caption>
<graphic xlink:href="ftox-04-846221-g002.tif"/>
</fig>
<p>The G/T SNP was associated with the indel in that the T allele was always paired with the deletion whereas the G allele was not. The T genotype was associated with increased susceptibility to abamectin exposure. These polymorphisms are displayed in <xref ref-type="table" rid="T1">Table 1</xref>. These polymorphisms are both upstream of <italic>sox7</italic> and located within a non-coding region.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>The SNP and Indel with variants listed as the reference (0) and alternate (1) alleles. Prevalence of the homozygous genotypes for both variants in affected and unaffected fish are shown in the table with the total number of fish with both genotypes at the bottom.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left"/>
<th colspan="2" align="center">Ref: G (0) Alt: T (1) Pos: 19066027</th>
<th colspan="2" align="center">Ref: ATATATATATATATATG (0) Alt: A (1) Pos: 19065990</th>
</tr>
<tr>
<th align="center">0/0</th>
<th align="center">1/1</th>
<th align="center">0/0</th>
<th align="center">1/1</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Affected</td>
<td align="center">58</td>
<td align="center">20</td>
<td align="center">33 (30 are G/G)</td>
<td align="center">16 (All T/T)</td>
</tr>
<tr>
<td align="left">Unaffected</td>
<td align="center">78</td>
<td align="center">9</td>
<td align="center">51 (50 are G/G)</td>
<td align="center">8 (All T/T)</td>
</tr>
<tr>
<td align="left">Total</td>
<td align="center">136</td>
<td align="center">29</td>
<td align="center">84</td>
<td align="center">24</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-2">
<title>3.2 <italic>In Silico</italic> Analysis to Identify Possible Mechanisms</title>
<sec id="s3-2-1">
<title>3.2.1 Transcription Factor Binding Site Prediction</title>
<p>One possible mechanism wherein an upstream sequence causes differential expression that leads to susceptibility differences is by acting as enhancers or promoters that recruit different transcription factors, leading to differential regulation of the downstream gene. The pathway enrichment analysis tool in the Comparative Toxicogenomics Database (CTD) shows that abamectin is enriched for effects on the signal transduction pathway which contains <italic>sox7</italic> (<xref ref-type="bibr" rid="B8">Davis et al., 2019</xref>). To test this possibility, transcription factor binding site prediction was employed using the Matbase package that is a part of the Genomatix software (<xref ref-type="bibr" rid="B7">Cartharius et al., 2005</xref>). Many differences in TFBSs were identified across all fish in the region upstream of <italic>sox7</italic>. Several of these were in the region that contains the indel and SNP. Some of these predicted sites are illustrated in <xref ref-type="fig" rid="F3">Figure 3</xref> and all predicted binding sites are present in <xref ref-type="sec" rid="s11">Supplementary Table S1</xref>.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Predicted transcription factor binding sites that are in the region of interest. This sequence contains the insert and the G polymorphism of the SNP with the predicted binding sites bracketed and labelled.</p>
</caption>
<graphic xlink:href="ftox-04-846221-g003.tif"/>
</fig>
</sec>
<sec id="s3-2-2">
<title>3.2.2 Analysis of Predicted Transcription Factor Binding Site</title>
<p>To identify significant differences between TFBSs, a chi-squared test was used to compare differences between TFBSs between all of the identified polymorphisms. Two different sequences stood out as having multiple highly significant differences between predicted TFBSs. One which contained the deletion that was previously identified as well as the T allele of the G/T SNP (TT) and one which contained the G allele (GG).</p>
<p>Predicted TFBSs with significant chi-squared values that were within the region of interest containing the SNP and indel (<xref ref-type="fig" rid="F4">Figure 4</xref>.) were identified. Differential protein binding of these proteins <italic>in vivo</italic> could contribute to susceptibility differences in individuals with differing sequences at this locus.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Heatmap showing all binding sites predicted to bind the GG sequence. The <italic>y</italic> axis shows the name of each predicted binding site. The <italic>x</italic> axis shows the distance of each predicted site from the region beginning with the indel and ending with the SNP. The colors, ranging from dark pink to yellow represent the chi-squared value when the predicted binding sites of the GG and TT genotypes are analyzed with a chi-squared test.</p>
</caption>
<graphic xlink:href="ftox-04-846221-g004.tif"/>
</fig>
</sec>
</sec>
<sec id="s3-3">
<title>3.3 Evaluating Protein Binding Between Sequences</title>
<sec id="s3-3-1">
<title>3.3.1 Electrophoretic Mobility Shift Assay Binding Assay</title>
<p>EMSA was done to establish protein-DNA interaction of the GG sequence <italic>in vitro</italic>. The first assay evaluated if the GG sequence was able to bind protein in zebrafish protein lysate. As seen in <xref ref-type="fig" rid="F5">Figure 5</xref> the sequence was shown to bind to a protein in the lysate.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>EMSA showing a competition assay done with varying concentrations of untagged GG and TT oligos. The first lane has no competitors in it and demonstrates the shift that happens when the tagged GG oligo and the protein lysate are added to the well. The band is highlighted by a red arrow. An example of the difference in bands when the GG or TT competitors are added is highlighted with a red box. The GG competitor produces a much lighter band, indicating that the GG sequence has more affinity for the protein that is being bound than the TT sequence.</p>
</caption>
<graphic xlink:href="ftox-04-846221-g005.tif"/>
</fig>
</sec>
<sec id="s3-3-2">
<title>3.3.2 Electrophoretic Mobility Shift Assay Competition Assay</title>
<p>To determine if the sequences had different binding affinities to the same protein a competition binding assay was done with a tagged GG oligo and an excess of untagged competitor TT or GG oligos at varying concentrations. If the competitors bound the same proteins with different affinities the untagged TT would pull away protein from the tagged GG sequence but with less efficiency than the untagged GG oligo. This would appear as a fainter band in wells that contained the untagged GG oligo compared to wells that contained the untagged TT oligo indicating that the TT sequence bound with less affinity than the GG sequence. <xref ref-type="fig" rid="F5">Figure 5</xref> indicates that this is the case. A fainter band can be identified clearly in several GG competition lanes when compared to the same concentrations of the TT competition wells. These results indicate that these two sequences bind differentially to the same protein.</p>
</sec>
</sec>
<sec id="s3-4">
<title>3.4 Investigating the Regulatory Activity of Different Sequences</title>
<sec id="s3-4-1">
<title>3.4.1 Luciferase Assay</title>
<p>The substantial predicted binding site differences between the GG and TT sequences, and the differential protein binding that was identified indicate that this locus may play an important role in <italic>sox7</italic> expression. To test if these polymorphisms alone, along with their different binding behavior could lead to expression differences, TT and GG were inserted into luciferase vectors which were transfected into MCF7 cells. <xref ref-type="fig" rid="F6">Figure 6</xref> shows luciferase expression in the cells across the three doses.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Bar chart displaying the average luciferase activity across three different vector inserts (GG, TT, and control) at 0&#xa0;&#x3bc;M <bold>(A)</bold> and 0.5&#xa0;&#x3bc;M <bold>(A)</bold> and 5&#xa0;&#x3bc;M abamectin <bold>(C)</bold>. The GG vector (left most) has higher expression in all three environments. The TT vector (middle) and control vector (right most) look similar and show lower expression except in response to the highest level of abamectin expression.</p>
</caption>
<graphic xlink:href="ftox-04-846221-g006.tif"/>
</fig>
</sec>
<sec id="s3-4-2">
<title>3.4.2 Statistical Analysis</title>
<p>Significant differences were found in luciferase expression across inserts in an ANOVA (Df &#x3d; 2, F &#x3d; 41.4, <italic>p</italic> &#x3d; 5.1e&#x2212;8). When compared using Tukey&#x2019;s test, cells with the TT or GG insert showed significant differences in luciferase expression (<italic>p</italic> adjusted &#x3d; 4.6e&#x2212;4). Cells with the TT or GG insert that were exposed to 0.5&#xa0;&#x3bc;M of abamectin also showed significant expression differences as well (<italic>p</italic> adjusted &#x3d; 4.7e&#x2212;4). There was also a significant difference between the GG cells and the control vector transfected cells when there was no exposure (<italic>p</italic> adjusted &#x3d; 1.3e&#x2212;04) and when they were exposed to 0.5&#xa0;&#x3bc;M of abamectin (<italic>p</italic> adjusted &#x3d; 2.7e&#x2212;03). The TT cells and control cells behaved similarly with regards to luciferase expression with no significant differences identified between them at either dose. There were no observed changes in expression in the cells with the same vector at different doses. While not visually apparent across the first two doses, abamectin dose had a significant affect on <italic>sox7</italic> expression when comparing across all three doses in a linear regression (<italic>t</italic> &#x3d; &#x2212;4.29, <italic>p</italic> &#x3d; 0.003).</p>
</sec>
</sec>
</sec>
<sec id="s4">
<title>4 Discussion</title>
<p>The results of this study reinforce the hypothesis that the sequences upstream of <italic>sox7</italic> containing the SNP and Indel that were profiled in this study act as regulators of the <italic>sox7</italic> gene, where regulatory differences caused by the two genotypes lead to differences in susceptibility to chemical exposure. The position of the variants upstream of Sox7 in a non-coding region, combined with the fact that two specific variants were highly associated with different outcomes after exposure points to the possibility that these sequences play a regulatory role in the expression of <italic>sox7</italic> as promoters, enhancers, and/or repressors. One mechanism that could explain the substantial differences in the effects of exposure and the expression of <italic>sox7</italic> is that these variants, in their role as regulators, bind different transcription factors. These binding differences then instigate differential regulation of Sox7 expression which leads to discrepancies in susceptibility to developmental defects brought on by chemical exposure.</p>
<p>
<italic>In silico</italic> analysis was done to look at possible TFBS differences between the two sequences which could bring about the observed expression differences. This analysis predicted that many of the TFBSs differed at the deletion and SNP loci. This led to the conclusion that these two sequences likely bind some factor with differing affinity, resulting in the observed expression differences between individuals with different genotypes. These results were used to guide further wet-lab experimentation.</p>
<p>Using EMSA, the ability of these sequences to bind protein was investigated. The results of the initial EMSA looking at the ability of the GG sequences to bind protein <italic>in vitro</italic> demonstrated that it bound a protein that is present during zebrafish development. A second EMSA, looking at competition between the two sequences, illustrated that there were pronounced differences in binding affinity between the two variants.</p>
<p>Binding differences between two sequences does not necessarily explain the expression differences that were associated with different developmental outcomes. A luciferase assay clearly displayed significant expression differences that were precipitated by the two different genotypes when inserted, with a minimal promoter, into human cells. This demonstrates that even without the longer promoter sequence; the SNP and indel were sufficient to change <italic>sox7</italic> expression.</p>
<p>The mechanism of differential susceptibility identified in this study is as follows: The differences in the hypervariable region upstream of <italic>sox7</italic> lead to differences in the suite of transcription factors that bind the DNA to affect <italic>sox7</italic> expression. This, in turn, causes differential expression of the important developmental factor Sox7. These expression differences during an organism&#x2019;s development contribute to susceptibility differences between organisms when exposed to abamectin. While the next steps in the adverse outcome pathway are subject to additional studies, we hypothesize that these expression differences might be connected to a developmental pathway involving <italic>sox7</italic> that is disrupted by abamectin without being able to compensate by expressing more protein.</p>
<p>Sox7 plays a crucial role in development in humans and fish alike (<xref ref-type="bibr" rid="B31">Stovall et al., 2014</xref>). Sox7 plays an especially important role in the development of hematopoietic pathways and vasculogenesis in many vertebrates including zebrafish, humans, and rodents (<xref ref-type="bibr" rid="B46">Pendeville et al., 2008</xref>; <xref ref-type="bibr" rid="B49">Francois et al., 2010</xref>; <xref ref-type="bibr" rid="B42">Carroll and North, 2014</xref>; <xref ref-type="bibr" rid="B44">Lomel&#xed; and Castillo-Castellanos, 2020</xref>). Differential expression of <italic>sox7</italic> could, therefore, cause susceptibility differences to chemical exposure, particularly during development. Sox7 downregulation has also been linked to breast cancer in humans (<xref ref-type="bibr" rid="B31">Stovall et al., 2014</xref>). Changes in the regulatory sequence upstream of SOX7 may be one factor responsible for these changes in expression related to breast cancer.</p>
<p>This study identified a hypervariable region upstream of the zebrafish <italic>sox7</italic> gene. Analysis of the region upstream of SOX7 in the Ensembl human genome assembly (GRCh38.p13) shows a known promoter and enhancer region on chromosome 8 from base pairs 10730506 to 10736999 (Chromosome 8: 10,730,506&#x2013;10,736,999, 8). The genome aggregation database (GnomAD) contains over 700 short variants (SNPs and Indels) that have been identified in this region but have not been investigated for phenotypic effects nor ties to susceptibility differences after chemical exposure (8-10730506-10736999 &#x7c; gnomAD v2.1.1 &#x7c; gnomAD). Non-coding regions are understudied, and there is little information on the evolutionary conservation of the region upstream of SOX7 between zebrafish and humans. Studies on the protein itself, though, have shown that there is 78% identity between the human and the zebrafish protein (<xref ref-type="bibr" rid="B49">Francois et al., 2010</xref>). This points to similarities being conserved across humans and zebrafish in this region that could point to important implications regarding human susceptibility to abamectin and other compounds that affect development through interactions with SOX7. Further investigation could use human data on exposure to abamectin and other related compounds (see concluding paragraph below) to uncover possible GxE and susceptibility differences that were implicated in this study and flagged in the initial high-throughput screening. The broader implications of this study are that a high-throughput screening method in a diverse population can successfully identify compounds that elicit GxE causing observable effects.</p>
<p>Zebrafish are the only vertebrate model that is currently compatible with high-throughput methods and shares a large degree of evolutionary conservation with humans (<xref ref-type="bibr" rid="B14">Garcia et al., 2016</xref>). Moreover, the HTS experiments described here cover the phylotypic stage, wherein vertebrate development across taxa are most similar, making developmental comparisons across vertebrates especially useful (<xref ref-type="bibr" rid="B14">Garcia et al., 2016</xref>). Zebrafish have proven especially useful in the study of human fetal development, vasculogenesis, hematopoiesis, brain development, thyroid function, and the hypothalamic-pituitary-thyroid axis (<xref ref-type="bibr" rid="B46">Pendeville et al., 2008</xref>, <xref ref-type="bibr" rid="B47">Liu et al., 2013</xref>; <xref ref-type="bibr" rid="B42">Carroll and North, 2014</xref>; <xref ref-type="bibr" rid="B43">Duboc et al., 2015</xref>; <xref ref-type="bibr" rid="B14">Garcia et al., 2016</xref>; <xref ref-type="bibr" rid="B48">Vancamp and Darras, 2018</xref>; <xref ref-type="bibr" rid="B44">Lomel&#xed; and Castillo-Castellanos, 2020</xref>). Thus, an HTS-compatible zebrafish model is adaptable to identifying GxE mechanisms behind susceptibility differences to chemical exposure that may be of direct human relevance. In future studies of additional exposures, the discovery path described here would necessarily be tailored or branched according to empirical results. This flexible method lays a foundation for the rapid discovery of chemicals that participate in GxE and the unraveling of their mechanisms.</p>
<p>Despite the promise and functionality of this high-throughput discovery method, the model that is being utilized does have drawbacks. The speed at which the screening is done imposes constraints on the breadth and depth of the analysis. As with any model, zebrafish are not a sufficient substitute for human studies. While they serve as important models that share a great deal of similarity with humans, there are many mechanistic and genetic differences between humans and zebrafish. Examples of studies aiming to understand these differences have documented how hematopoiesis occurs in a different organ, primitive blood cells are only unipotent, and there are some differences in signaling during development (<xref ref-type="bibr" rid="B42">Carroll and North, 2014</xref>; <xref ref-type="bibr" rid="B43">Duboc et al., 2015</xref>; <xref ref-type="bibr" rid="B44">Lomel&#xed; and Castillo-Castellanos, 2020</xref>).</p>
<p>Considering these strengths and limitations, we propose zebrafish HTS as an approach to begin addressing the paucity of information on GxE causing individual susceptibility differences to the tens of thousands of chemicals in the growing exposome. Analysis at this scale could rapidly screen for signals that require further investigation. Future studies would then be able to find mechanisms of GxE involving compounds of public health interest by following the information gleaned from HTS. Moreover, while identification of new and underinvestigated compounds that may be tied to differential susceptibility presents on ongoing challenge, the same critical question must be asked of otherwise well-studied compounds. In this manner, human health can be improved by new knowledge regarding existing, new, and well-studied compounds. Abamectin acts as a case study in the importance of gaining a better understanding of well-studied chemicals like the mectin family of compounds, where new exposures and usage patterns can introduce population health concerns. As illustration, consider data from the Centers for Disease Control showing that prescriptions for ivermectin for humans increased more than ten-fold, from 3,600 to 39,000, in 2020 amidst the COVID-19 pandemic (<xref ref-type="bibr" rid="B45">Health Alert Network (HAN), 2021</xref>). This method uses high-dimensional HTS data are interrogated for signals of differential susceptibility, also addresses some of the problems related to the assessment of differential individual susceptibility to chemical exposure. Namely, problems with sample sizes of sufficient power, mechanistic investigation, environmental variables, and the relationship between exposure and effect. Combining novel <italic>in silico</italic> and HT methods with existing <italic>in vitro</italic> and <italic>in vivo</italic> methods, this approach could lead to a new understanding of GxE and differential susceptibility that changes the current paradigm for parsing out GxE in diverse populations. Understanding GxE and the factors that contribute to susceptibility can lead to better risk assessment, a better grasp on the effects of a chemical, more effective regulation to improve human health, and an increasing knowledge of adverse outcome pathways.</p>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, PRJNA482650.</p>
</sec>
<sec id="s6">
<title>Ethics Statement</title>
<p>The animal study was reviewed and approved by the Oregon State University Institutional Animal Care and Use Committee approved protocol.</p>
</sec>
<sec id="s7">
<title>Author Contributions</title>
<p>DW drafted the manuscript. DW and PT performed analysis. JD, LT, DE, SK and RT generated experimental data. RT and DR obtained funding. All authors contributed to the study design and manuscript editing. All authors agreed to accountability for the content.</p>
</sec>
<sec id="s8">
<title>Funding</title>
<p>This work was supported by the National Institutes of Health (R56 ES030007, P42 ES016465, P30 ES030287, P42 ES031009, and P30 ES025128) and the Environmental Protection Agency (R839481).</p>
</sec>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>The authors would like to acknowledge the contributions of Joshua White (Oregon State University) for performing EMSAs, and Russell Schaaf (Oregon State University) for assistance with cloning.</p>
</ack>
<sec id="s11">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/ftox.2022.846221/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/ftox.2022.846221/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material>
<label>Supplementary Table S1</label>
<caption>
<p>Predicted transcription factor binding sites in the region upstream of sox7 in T5D zebrafish.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="DataSheet1.DOCX" id="SM1" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anastassiadou</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Arena</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Auteri</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Brancato</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bura</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Carrasco Cabrera</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Peer Review of the Pesticide Risk Assessment of the Active Substance Abamectin</article-title>. <source>Efs</source> <volume>18</volume> (<issue>8</issue>), <fpage>e06227</fpage>. <pub-id pub-id-type="doi">10.2903/j.efsa.2020.6227</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Balik-Meisner</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Truong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Scholl</surname>
<given-names>E. H.</given-names>
</name>
<name>
<surname>La Du</surname>
<given-names>J. K.</given-names>
</name>
<name>
<surname>Tanguay</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Reif</surname>
<given-names>D. M.</given-names>
</name>
</person-group> (<year>2018a</year>). <article-title>Elucidating Gene-By-Environment Interactions Associated with Differential Susceptibility to Chemical Exposure</article-title>. <source>Environ. Health Perspect.</source> <volume>126</volume> (<issue>6</issue>), <fpage>067010</fpage>. <pub-id pub-id-type="doi">10.1289/EHP2662</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Balik-Meisner</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Truong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Scholl</surname>
<given-names>E. H.</given-names>
</name>
<name>
<surname>Tanguay</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Reif</surname>
<given-names>D. M.</given-names>
</name>
</person-group> (<year>2018b</year>). <article-title>Population Genetic Diversity in Zebrafish Lines</article-title>. <source>Mamm. Genome</source> <volume>29</volume> (<issue>1&#x2013;2</issue>), <fpage>90</fpage>&#x2013;<lpage>100</lpage>. <pub-id pub-id-type="doi">10.1007/s00335-018-9735-x</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Barton</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>E. W.</given-names>
</name>
<name>
<surname>Tanguay</surname>
<given-names>R. L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Facility Design and Health Management Program at the Sinnhuber Aquatic Research Laboratory</article-title>. <source>Zebrafish</source>. <volume>S-39&#x2013;S-43</volume>. <pub-id pub-id-type="doi">10.1089/zeb.2015.1232</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Bergeson</surname>
<given-names>L. L.</given-names>
</name>
</person-group> (<year>2000</year>). <source>1953 TSCA : Toxic Substances Control Act; Chicago, Ill. : Section of Environment, Energy, and Resources</source>. <publisher-loc>Chicago</publisher-loc>: <publisher-name>American Bar Association</publisher-name>. <comment>[2000] &#xa9;2000</comment>. </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bolger</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Lohse</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Usadel</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Trimmomatic: A Flexible Trimmer for Illumina Sequence Data</article-title>. <source>Bioinformatics</source> <volume>30</volume> (<issue>15</issue>), <fpage>2114</fpage>&#x2013;<lpage>2120</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu170</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="web">
<collab>bwa.1</collab> (<year>2021</year>). <comment>Available at: <ext-link ext-link-type="uri" xlink:href="http://bio-bwa.sourceforge.net/bwa.shtml">http://bio-bwa.sourceforge.net/bwa.shtml</ext-link> (accessed 1208 2021</comment>.</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cartharius</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Frech</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Grote</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Klocke</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Haltmeier</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Klingenhoff</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>MatInspector and beyond: Promoter Analysis Based on Transcription Factor Binding Sites</article-title>. <source>Bioinformatics</source> <volume>21</volume> (<issue>13</issue>), <fpage>2933</fpage>&#x2013;<lpage>2942</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bti473</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Carroll</surname>
<given-names>K. J.</given-names>
</name>
<name>
<surname>North</surname>
<given-names>T. E.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Oceans of Opportunity: Exploring Vertebrate Hematopoiesis in zZebrafish</article-title>. <source>Exp. Hematol</source>. <volume>42</volume>, <fpage>684</fpage>&#x2013;<lpage>696</lpage>. </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davis</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Grondin</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Sciaky</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>McMorran</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>The Comparative Toxicogenomics Database: Update 2019</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume> (<issue>D1</issue>), <fpage>D948</fpage>&#x2013;<lpage>D954</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gky868</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DePristo</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Banks</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Poplin</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Garimella</surname>
<given-names>K. V.</given-names>
</name>
<name>
<surname>Maguire</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Hartl</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>A Framework for Variation Discovery and Genotyping Using Next-Generation DNA Sequencing Data</article-title>. <source>Nat. Genet.</source> <volume>43</volume> (<issue>5</issue>), <fpage>491</fpage>&#x2013;<lpage>498</lpage>. <pub-id pub-id-type="doi">10.1038/ng.806</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Duboc</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Dufourcq</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Blader</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Roussign&#x00E9;</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Asymmetry of the Brain: Development and Implications</article-title>. <source>Annu. Rev. Genet.</source> <volume>49</volume>, <fpage>647</fpage>&#x2013;<lpage>672</lpage>. </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ewels</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Magnusson</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lundin</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>K&#xe4;ller</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>MultiQC: Summarize Analysis Results for Multiple Tools and Samples in a Single Report</article-title>. <source>Bioinformatics</source> <volume>32</volume> (<issue>19</issue>), <fpage>3047</fpage>&#x2013;<lpage>3048</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btw354</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Francois</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Koopman</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Beltrame</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>SoxF Genes: Key Players in the Development of the Cardio-Vascular System</article-title>. <source>Int. J. Biochem. Cell Biol</source>. <volume>42</volume>, <fpage>445</fpage>&#x2013;<lpage>448</lpage>. </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Freedman</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Monteiro</surname>
<given-names>A. N. A.</given-names>
</name>
<name>
<surname>Gayther</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Coetzee</surname>
<given-names>G. A.</given-names>
</name>
<name>
<surname>Risch</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Plass</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Principles for the Post-GWAS Functional Characterization of Cancer Risk Loci</article-title>. <source>Nat. Genet.</source> <volume>43</volume> (<issue>6</issue>), <fpage>513</fpage>&#x2013;<lpage>518</lpage>. <pub-id pub-id-type="doi">10.1038/ng.840</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gamazon</surname>
<given-names>E. R.</given-names>
</name>
<name>
<surname>Perera</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Genome-Wide Approaches in Pharmacogenomics: Heritability Estimation and Pharmacoethnicity as Primary Challenges</article-title>. <source>Pharmacogenomics</source> <volume>13</volume> (<issue>10</issue>), <fpage>1101</fpage>&#x2013;<lpage>1104</lpage>. <pub-id pub-id-type="doi">10.2217/pgs.12.88</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garcia</surname>
<given-names>G. R.</given-names>
</name>
<name>
<surname>Bugel</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Truong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Spagnoli</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Tanguay</surname>
<given-names>R. L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>AHR2 Required for Normal Behavioral Responses and Proper Development of the Skeletal and Reproductive Systems in Zebrafish</article-title>. <source>Plos One</source> <volume>13</volume> (<issue>3</issue>), <fpage>e0193484</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0193484</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garcia</surname>
<given-names>G. R.</given-names>
</name>
<name>
<surname>Noyes</surname>
<given-names>P. D.</given-names>
</name>
<name>
<surname>Tanguay</surname>
<given-names>R. L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Advancements in Zebrafish Applications for 21st Century Toxicology</article-title>. <source>Pharmacol. Ther.</source> <volume>161</volume>, <fpage>11</fpage>&#x2013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1016/j.pharmthera.2016.03.009</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<collab>Health Alert Network (HAN)</collab> (<year>2021</year>). <source>HAN Archive&#x2013;00449 &#x007C; Health Alert Network (HAN)</source>. <comment>Available at <ext-link ext-link-type="uri" xlink:href="https://emergency.cdc.gov/han/2021/han00449.asp">https://emergency.cdc.gov/han/2021/han00449.asp</ext-link>
</comment>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jerry</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Shull</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Hadsell</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>Rijnkels</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Dunphy</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Schneider</surname>
<given-names>S. S.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Genetic Variation in Sensitivity to Estrogens and Breast Cancer Risk</article-title>. <source>Mamm. Genome</source> <volume>29</volume> (<issue>1&#x2013;2</issue>), <fpage>24</fpage>&#x2013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.1007/s00335-018-9741-z</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Kimmel</surname>
<given-names>C. B.</given-names>
</name>
<name>
<surname>Ballard</surname>
<given-names>W. W.</given-names>
</name>
<name>
<surname>Kimmel</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Ullmann</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Schilling</surname>
<given-names>T. F.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Stages of Embryonic Development of the Zebrafish</article-title>. <source>Dev. Dyn.</source> <volume>203</volume>, <fpage>3</fpage>. </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kinch</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Haynesworth</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kinch</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Hoyer</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>An Overview of FDA-Approved New Molecular Entities: 1827-2013</article-title>. <source>Drug Discov. Today</source> <volume>19</volume> (<issue>8</issue>), <fpage>1033</fpage>&#x2013;<lpage>1039</lpage>. <pub-id pub-id-type="doi">10.1016/j.drudis.2014.03.018</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le Marchand</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wilkens</surname>
<given-names>L. R.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Design Considerations for Genomic Association Studies: Importance of Gene-Environment Interactions</article-title>. <source>Cancer Epidemiol. Biomarkers Prev.</source> <volume>17</volume> (<issue>2</issue>), <fpage>263</fpage>&#x2013;<lpage>267</lpage>. <pub-id pub-id-type="doi">10.1158/1055-9965.EPI-07-0402</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Zebrafish Embryos/larvae for Rapid Determination of Effects on Hypothalamic-Pituitary-Thyroid (HPT) and Hypothalamic-Pituitary-Interrenal (HPI) Axis: mRNA Expression</article-title>. <source>Chemosphere</source>. <volume>93</volume>, <fpage>2327</fpage>&#x2013;<lpage>2332</lpage>. </citation>
</ref>
<ref id="B44">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lomel&#x00ED;</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Castillo-Castellanos</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Notch Signaling and the Emergence of Hematopoietic Stem Cells</article-title>. <source>Dev. Dyn</source>. <volume>249</volume>, <fpage>1302</fpage>&#x2013;<lpage>1317</lpage>. </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mandrell</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Truong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Jephson</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Sarker</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Moore</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lang</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Automated Zebrafish Chorion Removal and Single Embryo Placement: Optimizing Throughput of Zebrafish Developmental Toxicity Screens</article-title>. <source>J. Lab. Autom.</source> <volume>17</volume> (<issue>1</issue>), <fpage>66&#x2013;74</fpage>. <pub-id pub-id-type="doi">10.1177/2211068211432197</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McAllister</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Mechanic</surname>
<given-names>L. E.</given-names>
</name>
<name>
<surname>Amos</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Aschard</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Blair</surname>
<given-names>I. A.</given-names>
</name>
<name>
<surname>Chatterjee</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Current Challenges and New Opportunities for Gene-Environment Interaction Studies of Complex Diseases</article-title>. <source>Am. J. Epidemiol.</source> <volume>186</volume> (<issue>7</issue>), <fpage>753</fpage>&#x2013;<lpage>761</lpage>. <pub-id pub-id-type="doi">10.1093/aje/kwx227</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McKenna</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hanna</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Banks</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Sivachenko</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cibulskis</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Kernytsky</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>The Genome Analysis Toolkit: A MapReduce Framework for Analyzing Next-Generation DNA Sequencing Data</article-title>. <source>Genome Res.</source> <volume>20</volume> (<issue>9</issue>), <fpage>1297</fpage>&#x2013;<lpage>1303</lpage>. <pub-id pub-id-type="doi">10.1101/gr.107524.110</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mortensen</surname>
<given-names>H. M.</given-names>
</name>
<name>
<surname>Chamberlin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Joubert</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Angrish</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sipes</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J. S.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Leveraging Human Genetic and Adverse Outcome Pathway (AOP) Data to Inform Susceptibility in Human Health Risk Assessment</article-title>. <source>Mamm. Genome</source> <volume>29</volume> (<issue>1&#x2013;2</issue>), <fpage>190</fpage>&#x2013;<lpage>204</lpage>. <pub-id pub-id-type="doi">10.1007/s00335-018-9738-7</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mortensen</surname>
<given-names>H. M.</given-names>
</name>
<name>
<surname>Euling</surname>
<given-names>S. Y.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Integrating Mechanistic and Polymorphism Data to Characterize Human Genetic Susceptibility for Environmental Chemical Risk Assessment in the 21st Century</article-title>. <source>Toxicol. Appl. Pharmacol.</source> <volume>271</volume> (<issue>3</issue>), <fpage>395</fpage>&#x2013;<lpage>404</lpage>. <pub-id pub-id-type="doi">10.1016/j.taap.2011.01.015</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Motsinger-Reif</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Jorgenson</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Relling</surname>
<given-names>M. V.</given-names>
</name>
<name>
<surname>Kroetz</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>Weinshilboum</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Cox</surname>
<given-names>N. J.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Genome-wide Association Studies in Pharmacogenomics</article-title>. <source>Pharmacogenetics and Genomics</source> <volume>23</volume> (<issue>8</issue>), <fpage>383</fpage>&#x2013;<lpage>394</lpage>. <pub-id pub-id-type="doi">10.1097/FPC.0b013e32833d7b45</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="book">
<collab>National Research Council</collab> (<year>2009</year>). <source>Science and Decisions: Advancing Risk Assessment</source>. <publisher-loc>Washington, D.C.</publisher-loc>: <publisher-name>National Academies Press</publisher-name>, <fpage>12209</fpage>. <pub-id pub-id-type="doi">10.17226/12209</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Pendeville</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Winandy</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Manfroid</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Nivelles</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Motte</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Pasque</surname>
<given-names>V.</given-names>
</name>
<etal/>
</person-group> (<year>2008</year>). <article-title>Zebrafish Sox7 and Sox18 Function Together to Control Arterial&#x2010;Venous Identity</article-title>. <source>Dev. Biol</source>. <volume>317</volume>, <fpage>405</fpage>&#x2013;<lpage>416</lpage>. </citation>
</ref>
<ref id="B25">
<citation citation-type="web">
<collab>Picard Tools - By Broad Institute</collab> (<year>2021</year>). <comment>Available at: <ext-link ext-link-type="uri" xlink:href="http://broadinstitute.github.io/picard/">http://broadinstitute.github.io/picard/</ext-link> (Accessed December 08, 2021)</comment>.</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Purcell</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Neale</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Todd-Brown</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Thomas</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>M. A. R.</given-names>
</name>
<name>
<surname>Bender</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2007</year>). <article-title>PLINK: A Tool Set for Whole-Genome Association and Population-Based Linkage Analyses</article-title>. <source>Am. J. Hum. Genet.</source> <volume>81</volume> (<issue>3</issue>), <fpage>559</fpage>&#x2013;<lpage>575</lpage>. <pub-id pub-id-type="doi">10.1086/519795</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qin</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Tanis</surname>
<given-names>K. Q.</given-names>
</name>
<name>
<surname>Podtelezhnikov</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Glaab</surname>
<given-names>W. E.</given-names>
</name>
<name>
<surname>Sistare</surname>
<given-names>F. D.</given-names>
</name>
<name>
<surname>DeGeorge</surname>
<given-names>J. J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Toxicogenomics in Drug Development: A Match Made in Heaven?</article-title> <source>Expert Opin. Drug Metab. Toxicol.</source> <volume>12</volume> (<issue>8</issue>), <fpage>847</fpage>&#x2013;<lpage>849</lpage>. <pub-id pub-id-type="doi">10.1080/17425255.2016.1175437</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="book">
<collab>R Core Team</collab> (<year>2020</year>). <source>R: A Language and Environment for Statistical Computing</source>. <publisher-loc>Vienna, Austria</publisher-loc>: <publisher-name>R Foundation for Statistical Computing</publisher-name>. </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reif</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Truong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Mandrell</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Marvel</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Tanguay</surname>
<given-names>R. L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>High-Throughput Characterization of Chemical-Associated Embryonic Behavioral Changes Predicts Teratogenic Outcomes</article-title>. <source>Arch. Toxicol.</source> <volume>90</volume> (<issue>6</issue>), <fpage>1459</fpage>&#x2013;<lpage>1470</lpage>. <pub-id pub-id-type="doi">10.1007/s00204-015-1554-1</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roden</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Wilke</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Kroemer</surname>
<given-names>H. K.</given-names>
</name>
<name>
<surname>Stein</surname>
<given-names>C. M.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Pharmacogenomics</article-title>. <source>Circulation</source> <volume>123</volume> (<issue>15</issue>), <fpage>1661</fpage>&#x2013;<lpage>1670</lpage>. <pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.109.914820</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Stovall</surname>
<given-names>D. B.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sui</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>SOX7: From a Developmental Regulator to an Emerging Tumor Suppressor</article-title>. <source>Histol. Histopathol.</source> <volume>29</volume> (<issue>4</issue>), <fpage>439</fpage>&#x2013;<lpage>445</lpage>. </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Suter</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Babiss</surname>
<given-names>L. E.</given-names>
</name>
<name>
<surname>Wheeldon</surname>
<given-names>E. B.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Toxicogenomics in Predictive Toxicology in Drug Development</article-title>. <source>Chem. Biol.</source> <volume>11</volume> (<issue>2</issue>), <fpage>161</fpage>&#x2013;<lpage>171</lpage>. <pub-id pub-id-type="doi">10.1016/j.chembiol.2004.02.003</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Truong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Bugel</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Chlebowski</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Usenko</surname>
<given-names>C. Y.</given-names>
</name>
<name>
<surname>Simonich</surname>
<given-names>M. T.</given-names>
</name>
<name>
<surname>Simonich</surname>
<given-names>S. L. M.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Optimizing Multi-Dimensional High Throughput Screening Using Zebrafish</article-title>. <source>Reprod. Toxicol.</source> <volume>65</volume>, <fpage>139</fpage>&#x2013;<lpage>147</lpage>. <pub-id pub-id-type="doi">10.1016/j.reprotox.2016.05.015</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Truong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Harper</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Tanguay</surname>
<given-names>R. L.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Evaluation of Embryotoxicity Using the Zebrafish Model</article-title>. <source>Drug Saf. Eval.</source> <volume>691</volume>, <fpage>271</fpage>&#x2013;<lpage>279</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-60761-849-2_16</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Truong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Reif</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>St Mary</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Geier</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Truong</surname>
<given-names>H. D.</given-names>
</name>
<name>
<surname>Tanguay</surname>
<given-names>R. L.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Multidimensional <italic>In Vivo</italic> Hazard Assessment Using Zebrafish</article-title>. <source>Toxicol. Sci.</source> <volume>137</volume> (<issue>1</issue>), <fpage>212</fpage>&#x2013;<lpage>233</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kft235</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="book">
<collab>United States</collab> (<year>1986</year>). <source>Toxic Substances Control Act (TSCA) Chemical Substance Inventory</source>. <publisher-loc>Washington, D.C.</publisher-loc> <publisher-name>U.S. Environmental Protection Agency, Office of Toxic Substances.</publisher-name> </citation>
</ref>
<ref id="B48">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Vancamp</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Darras</surname>
<given-names>V. M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>From Zebrafish to Human: A Comparative Approach to Elucidate the Role of the Thyroid Hormone Transporter MCT8 During Brain Development</article-title>. <source>Gen. Comp. Endocr.</source> <volume>265</volume>, <fpage>219</fpage>&#x2013;<lpage>229</lpage>. </citation>
</ref>
<ref id="B37">
<citation citation-type="web">
<collab>Zfin Gene</collab> (<year>2021</year>). <article-title>sox7</article-title>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://zfin.org/ZDB-GENE-040109-4#summary">https://zfin.org/ZDB-GENE-040109-4&#x23;summary</ext-link> (Accessed December 08, 2021)</comment>. </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Roell</surname>
<given-names>K. R.</given-names>
</name>
<name>
<surname>Truong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Tanguay</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Reif</surname>
<given-names>D. M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>A Data-Driven Weighting Scheme for Multivariate Phenotypic Endpoints Recapitulates Zebrafish Developmental Cascades</article-title>. <source>Toxicol. Appl. Pharmacol.</source> <volume>314</volume>, <fpage>109</fpage>&#x2013;<lpage>117</lpage>. <pub-id pub-id-type="doi">10.1016/j.taap.2016.11.010</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Luoma</surname>
<given-names>S. E.</given-names>
</name>
<name>
<surname>St. Armour</surname>
<given-names>G. E. G. E.</given-names>
</name>
<name>
<surname>Thakkar</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Mackay</surname>
<given-names>T. F. C.</given-names>
</name>
<name>
<surname>Anholt</surname>
<given-names>R. R. H.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>A Drosophila Model for Toxicogenomics: Genetic Variation in Susceptibility to Heavy Metal Exposure</article-title>. <source>Plos Genet.</source> <volume>13</volume> (<issue>7</issue>), <fpage>e1006907</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1006907</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>